11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8b5fa320bSStefano Zampini #include <petscblaslapack.h> 9397b6df1SKris Buschelman 10397b6df1SKris Buschelman EXTERN_C_BEGIN 11397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 122907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 132907cef9SHong Zhang #include <cmumps_c.h> 142907cef9SHong Zhang #else 15c6db04a5SJed Brown #include <zmumps_c.h> 162907cef9SHong Zhang #endif 172907cef9SHong Zhang #else 182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 192907cef9SHong Zhang #include <smumps_c.h> 20397b6df1SKris Buschelman #else 21c6db04a5SJed Brown #include <dmumps_c.h> 22397b6df1SKris Buschelman #endif 232907cef9SHong Zhang #endif 24397b6df1SKris Buschelman EXTERN_C_END 25397b6df1SKris Buschelman #define JOB_INIT -1 263d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 273d472b54SHong Zhang #define JOB_FACTNUMERIC 2 283d472b54SHong Zhang #define JOB_SOLVE 3 29397b6df1SKris Buschelman #define JOB_END -2 303d472b54SHong Zhang 312907cef9SHong Zhang /* calls to MUMPS */ 322907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 332907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 342907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 352907cef9SHong Zhang #else 362907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 372907cef9SHong Zhang #endif 382907cef9SHong Zhang #else 392907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 402907cef9SHong Zhang #define PetscMUMPS_c smumps_c 412907cef9SHong Zhang #else 422907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 432907cef9SHong Zhang #endif 442907cef9SHong Zhang #endif 452907cef9SHong Zhang 46940cd9d6SSatish Balay /* declare MumpsScalar */ 47940cd9d6SSatish Balay #if defined(PETSC_USE_COMPLEX) 
48940cd9d6SSatish Balay #if defined(PETSC_USE_REAL_SINGLE) 49940cd9d6SSatish Balay #define MumpsScalar mumps_complex 50940cd9d6SSatish Balay #else 51940cd9d6SSatish Balay #define MumpsScalar mumps_double_complex 52940cd9d6SSatish Balay #endif 53940cd9d6SSatish Balay #else 54940cd9d6SSatish Balay #define MumpsScalar PetscScalar 55940cd9d6SSatish Balay #endif 563d472b54SHong Zhang 57397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 58397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 59397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 60397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 61a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 62397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 63adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 64397b6df1SKris Buschelman 65397b6df1SKris Buschelman typedef struct { 66397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 672907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 682907cef9SHong Zhang CMUMPS_STRUC_C id; 692907cef9SHong Zhang #else 70397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 712907cef9SHong Zhang #endif 722907cef9SHong Zhang #else 732907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 742907cef9SHong Zhang SMUMPS_STRUC_C id; 75397b6df1SKris Buschelman #else 76397b6df1SKris Buschelman DMUMPS_STRUC_C id; 77397b6df1SKris Buschelman #endif 782907cef9SHong Zhang #endif 792907cef9SHong Zhang 80397b6df1SKris Buschelman MatStructure matstruc; 81c1490034SHong Zhang PetscMPIInt myid,size; 82a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 83397b6df1SKris Buschelman PetscScalar *val; 84397b6df1SKris Buschelman MPI_Comm comm_mumps; 856f3cc6f9SBarry Smith PetscBool isAIJ; 86a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 87801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 88801fbe65SHong Zhang Vec b_seq,x_seq; 89b34f08ffSHong Zhang PetscInt ninfo,*info; /* display INFO */ 90b5fa320bSStefano Zampini 
PetscInt sizeredrhs; 91b5fa320bSStefano Zampini PetscInt *schur_pivots; 9259ac8732SStefano Zampini PetscInt schur_B_lwork; 93b5fa320bSStefano Zampini PetscScalar *schur_work; 9459ac8732SStefano Zampini PetscScalar *schur_sol; 9559ac8732SStefano Zampini PetscInt schur_sizesol; 9659ac8732SStefano Zampini PetscBool schur_factored; 9759ac8732SStefano Zampini PetscBool schur_inverted; 982205254eSKarl Rupp 99bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 100f0c56d0fSKris Buschelman } Mat_MUMPS; 101f0c56d0fSKris Buschelman 10209573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 103b24902e0SBarry Smith 10459ac8732SStefano Zampini #undef __FUNCT__ 10559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsResetSchur_Private" 10659ac8732SStefano Zampini static PetscErrorCode MatMumpsResetSchur_Private(Mat_MUMPS* mumps) 107b5fa320bSStefano Zampini { 108b5fa320bSStefano Zampini PetscErrorCode ierr; 109b5fa320bSStefano Zampini 110b5fa320bSStefano Zampini PetscFunctionBegin; 11159ac8732SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 11259ac8732SStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 11359ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 11459ac8732SStefano Zampini ierr = PetscFree(mumps->schur_pivots);CHKERRQ(ierr); 11559ac8732SStefano Zampini ierr = PetscFree(mumps->schur_work);CHKERRQ(ierr); 11659ac8732SStefano Zampini mumps->id.size_schur = 0; 11759ac8732SStefano Zampini mumps->id.ICNTL(19) = 0; 11859ac8732SStefano Zampini PetscFunctionReturn(0); 11959ac8732SStefano Zampini } 12059ac8732SStefano Zampini 12159ac8732SStefano Zampini #undef __FUNCT__ 12259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsFactorSchur_Private" 12359ac8732SStefano Zampini static PetscErrorCode MatMumpsFactorSchur_Private(Mat_MUMPS* mumps) 12459ac8732SStefano Zampini { 12559ac8732SStefano Zampini 
PetscBLASInt B_N,B_ierr,B_slda; 12659ac8732SStefano Zampini PetscErrorCode ierr; 12759ac8732SStefano Zampini 12859ac8732SStefano Zampini PetscFunctionBegin; 12959ac8732SStefano Zampini if (mumps->schur_factored) { 13059ac8732SStefano Zampini PetscFunctionReturn(0); 13159ac8732SStefano Zampini } 13259ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 13359ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 13459ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 13559ac8732SStefano Zampini if (!mumps->schur_pivots) { 13659ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 13759ac8732SStefano Zampini } 13859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 13959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&B_N,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&B_ierr)); 14059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 14159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRF Lapack routine %d",(int)B_ierr); 14259ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 14359ac8732SStefano Zampini char ord[2]; 14459ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 14559ac8732SStefano Zampini sprintf(ord,"L"); 14659ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 14759ac8732SStefano Zampini sprintf(ord,"U"); 14859ac8732SStefano Zampini } 14959ac8732SStefano Zampini if (mumps->id.sym == 2) { 15059ac8732SStefano Zampini if (!mumps->schur_pivots) { 15159ac8732SStefano Zampini PetscScalar lwork; 15259ac8732SStefano Zampini 15359ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 15459ac8732SStefano Zampini mumps->schur_B_lwork=-1; 
15559ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 15659ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 15759ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 15859ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYTRF Lapack routine %d",(int)B_ierr); 15959ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 16059ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 16159ac8732SStefano Zampini } 16259ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16359ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 16459ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 16559ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRF Lapack routine %d",(int)B_ierr); 16659ac8732SStefano Zampini } else { 16759ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16859ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,&B_ierr)); 16959ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17059ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRF Lapack routine %d",(int)B_ierr); 17159ac8732SStefano Zampini } 17259ac8732SStefano Zampini } 17359ac8732SStefano Zampini mumps->schur_factored = PETSC_TRUE; 17459ac8732SStefano Zampini PetscFunctionReturn(0); 17559ac8732SStefano Zampini } 17659ac8732SStefano Zampini 17759ac8732SStefano Zampini #undef __FUNCT__ 17859ac8732SStefano Zampini #define __FUNCT__ 
"MatMumpsInvertSchur_Private" 17959ac8732SStefano Zampini static PetscErrorCode MatMumpsInvertSchur_Private(Mat_MUMPS* mumps) 18059ac8732SStefano Zampini { 18159ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 18259ac8732SStefano Zampini PetscErrorCode ierr; 18359ac8732SStefano Zampini 18459ac8732SStefano Zampini PetscFunctionBegin; 18559ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 18659ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 18759ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 18859ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 18959ac8732SStefano Zampini if (!mumps->schur_work) { 19059ac8732SStefano Zampini PetscScalar lwork; 19159ac8732SStefano Zampini 19259ac8732SStefano Zampini mumps->schur_B_lwork = -1; 19359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 19459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 19559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 19659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GETRI Lapack routine %d",(int)B_ierr); 19759ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 19859ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 19959ac8732SStefano Zampini } 20059ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20159ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 20259ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20359ac8732SStefano Zampini if (B_ierr) 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRI Lapack routine %d",(int)B_ierr); 20459ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 20559ac8732SStefano Zampini char ord[2]; 20659ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 20759ac8732SStefano Zampini sprintf(ord,"L"); 20859ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 20959ac8732SStefano Zampini sprintf(ord,"U"); 21059ac8732SStefano Zampini } 21159ac8732SStefano Zampini if (mumps->id.sym == 2) { 21259ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21359ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&B_ierr)); 21459ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 21559ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRI Lapack routine %d",(int)B_ierr); 21659ac8732SStefano Zampini } else { 21759ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21859ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,&B_ierr)); 21959ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22059ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRI Lapack routine %d",(int)B_ierr); 22159ac8732SStefano Zampini } 22259ac8732SStefano Zampini } 22359ac8732SStefano Zampini mumps->schur_inverted = PETSC_TRUE; 22459ac8732SStefano Zampini PetscFunctionReturn(0); 22559ac8732SStefano Zampini } 22659ac8732SStefano Zampini 22759ac8732SStefano Zampini #undef __FUNCT__ 22859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchur_Private" 229e807eca7SStefano Zampini static PetscErrorCode MatMumpsSolveSchur_Private(Mat_MUMPS* mumps, PetscBool sol_in_redrhs) 
23059ac8732SStefano Zampini { 23159ac8732SStefano Zampini PetscBLASInt B_N,B_Nrhs,B_ierr,B_slda,B_rlda; 23259ac8732SStefano Zampini PetscScalar one=1.,zero=0.; 23359ac8732SStefano Zampini PetscErrorCode ierr; 23459ac8732SStefano Zampini 23559ac8732SStefano Zampini PetscFunctionBegin; 23659ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 237b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 238b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 239b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.nrhs,&B_Nrhs);CHKERRQ(ierr); 240b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.lredrhs,&B_rlda);CHKERRQ(ierr); 24159ac8732SStefano Zampini if (mumps->schur_inverted) { 24259ac8732SStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 24359ac8732SStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 24459ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 24559ac8732SStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 24659ac8732SStefano Zampini mumps->schur_sizesol = sizesol; 247b5fa320bSStefano Zampini } 24859ac8732SStefano Zampini if (!mumps->sym) { 24959ac8732SStefano Zampini char type[2]; 250b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 25159ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25259ac8732SStefano Zampini sprintf(type,"N"); 253b5fa320bSStefano Zampini } else { 25459ac8732SStefano Zampini sprintf(type,"T"); 255b5fa320bSStefano Zampini } 25659ac8732SStefano Zampini } else { /* stored by columns */ 25759ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25859ac8732SStefano Zampini sprintf(type,"T"); 25959ac8732SStefano Zampini } else { 26059ac8732SStefano Zampini sprintf(type,"N"); 26159ac8732SStefano Zampini } 26259ac8732SStefano Zampini } 26359ac8732SStefano Zampini 
PetscStackCallBLAS("BLASgemm",BLASgemm_(type,"N",&B_N,&B_Nrhs,&B_N,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 26459ac8732SStefano Zampini } else { 26559ac8732SStefano Zampini char ord[2]; 26659ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 26759ac8732SStefano Zampini sprintf(ord,"L"); 26859ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 26959ac8732SStefano Zampini sprintf(ord,"U"); 27059ac8732SStefano Zampini } 27159ac8732SStefano Zampini PetscStackCallBLAS("BLASsymm",BLASsymm_("L",ord,&B_N,&B_Nrhs,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27259ac8732SStefano Zampini } 273e807eca7SStefano Zampini if (sol_in_redrhs) { 27459ac8732SStefano Zampini ierr = PetscMemcpy(mumps->id.redrhs,mumps->schur_sol,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 275e807eca7SStefano Zampini } 276a12f35bfSStefano Zampini } else { /* Schur complement has not been inverted */ 277a12f35bfSStefano Zampini MumpsScalar *orhs=NULL; 278a12f35bfSStefano Zampini 279a12f35bfSStefano Zampini if (!sol_in_redrhs) { 280a12f35bfSStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 281a12f35bfSStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 282a12f35bfSStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 283a12f35bfSStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 284a12f35bfSStefano Zampini mumps->schur_sizesol = sizesol; 285a12f35bfSStefano Zampini } 286a12f35bfSStefano Zampini orhs = mumps->id.redrhs; 287a12f35bfSStefano Zampini ierr = PetscMemcpy(mumps->schur_sol,mumps->id.redrhs,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 288a12f35bfSStefano Zampini mumps->id.redrhs = (MumpsScalar*)mumps->schur_sol; 289a12f35bfSStefano Zampini } 29059ac8732SStefano Zampini if 
(!mumps->sym) { /* MUMPS always return a full Schur matrix */ 29159ac8732SStefano Zampini char type[2]; 29259ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 29359ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 29459ac8732SStefano Zampini sprintf(type,"N"); 29559ac8732SStefano Zampini } else { 29659ac8732SStefano Zampini sprintf(type,"T"); 29759ac8732SStefano Zampini } 29859ac8732SStefano Zampini } else { /* stored by columns */ 29959ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30059ac8732SStefano Zampini sprintf(type,"T"); 30159ac8732SStefano Zampini } else { 30259ac8732SStefano Zampini sprintf(type,"N"); 30359ac8732SStefano Zampini } 30459ac8732SStefano Zampini } 30559ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 30659ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_(type,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 307b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 308b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRS Lapack routine %d",(int)B_ierr); 309b5fa320bSStefano Zampini } else { /* either full or lower-triangular (not packed) */ 310b5fa320bSStefano Zampini char ord[2]; 311b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 312b5fa320bSStefano Zampini sprintf(ord,"L"); 313b5fa320bSStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 314b5fa320bSStefano Zampini sprintf(ord,"U"); 315b5fa320bSStefano Zampini } 316b5fa320bSStefano Zampini if (mumps->id.sym == 2) { 317b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 31859ac8732SStefano Zampini 
PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 319b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 320b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRS Lapack routine %d",(int)B_ierr); 321b5fa320bSStefano Zampini } else { 322b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32359ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 324b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 325b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRS Lapack routine %d",(int)B_ierr); 326b5fa320bSStefano Zampini } 327b5fa320bSStefano Zampini } 328e807eca7SStefano Zampini if (!sol_in_redrhs) { 329a12f35bfSStefano Zampini mumps->id.redrhs = orhs; 330e807eca7SStefano Zampini } 33159ac8732SStefano Zampini } 332b5fa320bSStefano Zampini PetscFunctionReturn(0); 333b5fa320bSStefano Zampini } 334b5fa320bSStefano Zampini 33559ac8732SStefano Zampini #undef __FUNCT__ 33659ac8732SStefano Zampini #define __FUNCT__ "MatMumpsHandleSchur_Private" 337b8f61ee1SStefano Zampini static PetscErrorCode MatMumpsHandleSchur_Private(Mat_MUMPS* mumps, PetscBool expansion) 338b5fa320bSStefano Zampini { 339b5fa320bSStefano Zampini PetscErrorCode ierr; 340b5fa320bSStefano Zampini 341b5fa320bSStefano Zampini PetscFunctionBegin; 342b5fa320bSStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing when Schur complement has not been computed */ 343b5fa320bSStefano Zampini PetscFunctionReturn(0); 344b5fa320bSStefano Zampini } 345b8f61ee1SStefano Zampini if (!expansion) { /* prepare for the condensation step */ 346b5fa320bSStefano Zampini PetscInt sizeredrhs = mumps->id.nrhs*mumps->id.size_schur; 347b5fa320bSStefano Zampini /* allocate 
MUMPS internal array to store reduced right-hand sides */ 348b5fa320bSStefano Zampini if (!mumps->id.redrhs || sizeredrhs > mumps->sizeredrhs) { 349b5fa320bSStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 350b5fa320bSStefano Zampini mumps->id.lredrhs = mumps->id.size_schur; 351b5fa320bSStefano Zampini ierr = PetscMalloc1(mumps->id.nrhs*mumps->id.lredrhs,&mumps->id.redrhs);CHKERRQ(ierr); 352b5fa320bSStefano Zampini mumps->sizeredrhs = mumps->id.nrhs*mumps->id.lredrhs; 353b5fa320bSStefano Zampini } 354b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 1; /* condensation phase */ 355b5fa320bSStefano Zampini } else { /* prepare for the expansion step */ 356b8f61ee1SStefano Zampini /* solve Schur complement (this has to be done by the MUMPS user, so basically us) */ 357e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 358b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 2; /* expansion phase */ 359b5fa320bSStefano Zampini PetscMUMPS_c(&mumps->id); 360b5fa320bSStefano Zampini if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 361b5fa320bSStefano Zampini /* restore defaults */ 362b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 363b5fa320bSStefano Zampini } 364b5fa320bSStefano Zampini PetscFunctionReturn(0); 365b5fa320bSStefano Zampini } 366b5fa320bSStefano Zampini 367397b6df1SKris Buschelman /* 368d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], col[nz], val[nz] 369d341cd04SHong Zhang 370397b6df1SKris Buschelman input: 37167877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 372397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 
373bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 374bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 375397b6df1SKris Buschelman output: 376397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 377397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 378eb9baa12SBarry Smith 379eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 380eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 381eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 382eb9baa12SBarry Smith 383397b6df1SKris Buschelman */ 38416ebf90aSShri Abhyankar 38516ebf90aSShri Abhyankar #undef __FUNCT__ 38616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 387bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 388b24902e0SBarry Smith { 389185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 39067877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 391dfbe8321SBarry Smith PetscErrorCode ierr; 392c1490034SHong Zhang PetscInt *row,*col; 39316ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 394397b6df1SKris Buschelman 395397b6df1SKris Buschelman PetscFunctionBegin; 39616ebf90aSShri Abhyankar *v=aa->a; 397bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 3982205254eSKarl Rupp nz = aa->nz; 3992205254eSKarl Rupp ai = aa->i; 4002205254eSKarl Rupp aj = aa->j; 40116ebf90aSShri Abhyankar *nnz = nz; 402785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 403185f6596SHong Zhang col = row + nz; 404185f6596SHong Zhang 40516ebf90aSShri Abhyankar nz = 0; 40616ebf90aSShri Abhyankar for (i=0; i<M; i++) { 
40716ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 40867877ebaSShri Abhyankar ajj = aj + ai[i]; 40967877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 41067877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 41116ebf90aSShri Abhyankar } 41216ebf90aSShri Abhyankar } 41316ebf90aSShri Abhyankar *r = row; *c = col; 41416ebf90aSShri Abhyankar } 41516ebf90aSShri Abhyankar PetscFunctionReturn(0); 41616ebf90aSShri Abhyankar } 417397b6df1SKris Buschelman 41816ebf90aSShri Abhyankar #undef __FUNCT__ 41967877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 420bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 42167877ebaSShri Abhyankar { 42267877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)A->data; 42333d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 42433d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 42567877ebaSShri Abhyankar PetscErrorCode ierr; 42667877ebaSShri Abhyankar PetscInt *row,*col; 42767877ebaSShri Abhyankar 42867877ebaSShri Abhyankar PetscFunctionBegin; 42933d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 43033d57670SJed Brown M = A->rmap->N/bs; 431cf3759fdSShri Abhyankar *v = aa->a; 432bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 433cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 43467877ebaSShri Abhyankar nz = bs2*aa->nz; 43567877ebaSShri Abhyankar *nnz = nz; 436785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 437185f6596SHong Zhang col = row + nz; 438185f6596SHong Zhang 43967877ebaSShri Abhyankar for (i=0; i<M; i++) { 44067877ebaSShri Abhyankar ajj = aj + ai[i]; 44167877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 44267877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 44367877ebaSShri Abhyankar for (j=0; j<bs; j++) { 44467877ebaSShri Abhyankar for (m=0; m<bs; m++) { 44567877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 446cf3759fdSShri Abhyankar col[idx++] = 
bs*(ajj[k]) + j + shift; 44767877ebaSShri Abhyankar } 44867877ebaSShri Abhyankar } 44967877ebaSShri Abhyankar } 45067877ebaSShri Abhyankar } 451cf3759fdSShri Abhyankar *r = row; *c = col; 45267877ebaSShri Abhyankar } 45367877ebaSShri Abhyankar PetscFunctionReturn(0); 45467877ebaSShri Abhyankar } 45567877ebaSShri Abhyankar 45667877ebaSShri Abhyankar #undef __FUNCT__ 45716ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 458bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 45916ebf90aSShri Abhyankar { 46067877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 46167877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 46216ebf90aSShri Abhyankar PetscErrorCode ierr; 46316ebf90aSShri Abhyankar PetscInt *row,*col; 46416ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 46516ebf90aSShri Abhyankar 46616ebf90aSShri Abhyankar PetscFunctionBegin; 467882afa5aSHong Zhang *v = aa->a; 468bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4692205254eSKarl Rupp nz = aa->nz; 4702205254eSKarl Rupp ai = aa->i; 4712205254eSKarl Rupp aj = aa->j; 4722205254eSKarl Rupp *v = aa->a; 47316ebf90aSShri Abhyankar *nnz = nz; 474785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 475185f6596SHong Zhang col = row + nz; 476185f6596SHong Zhang 47716ebf90aSShri Abhyankar nz = 0; 47816ebf90aSShri Abhyankar for (i=0; i<M; i++) { 47916ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 48067877ebaSShri Abhyankar ajj = aj + ai[i]; 48167877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 48267877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 48316ebf90aSShri Abhyankar } 48416ebf90aSShri Abhyankar } 48516ebf90aSShri Abhyankar *r = row; *c = col; 48616ebf90aSShri Abhyankar } 48716ebf90aSShri Abhyankar PetscFunctionReturn(0); 48816ebf90aSShri Abhyankar } 48916ebf90aSShri Abhyankar 49016ebf90aSShri Abhyankar #undef __FUNCT__ 
49116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 492bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 49316ebf90aSShri Abhyankar { 49467877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 49567877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 49667877ebaSShri Abhyankar const PetscScalar *av,*v1; 49716ebf90aSShri Abhyankar PetscScalar *val; 49816ebf90aSShri Abhyankar PetscErrorCode ierr; 49916ebf90aSShri Abhyankar PetscInt *row,*col; 500829b1710SHong Zhang Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 50116ebf90aSShri Abhyankar 50216ebf90aSShri Abhyankar PetscFunctionBegin; 50316ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 50416ebf90aSShri Abhyankar adiag=aa->diag; 505bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 506829b1710SHong Zhang /* count nz in the uppper triangular part of A */ 507829b1710SHong Zhang nz = 0; 508829b1710SHong Zhang for (i=0; i<M; i++) nz += ai[i+1] - adiag[i]; 50916ebf90aSShri Abhyankar *nnz = nz; 510829b1710SHong Zhang 511185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 512185f6596SHong Zhang col = row + nz; 513185f6596SHong Zhang val = (PetscScalar*)(col + nz); 514185f6596SHong Zhang 51516ebf90aSShri Abhyankar nz = 0; 51616ebf90aSShri Abhyankar for (i=0; i<M; i++) { 51716ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 51867877ebaSShri Abhyankar ajj = aj + adiag[i]; 519cf3759fdSShri Abhyankar v1 = av + adiag[i]; 52067877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 52167877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 52216ebf90aSShri Abhyankar } 52316ebf90aSShri Abhyankar } 52416ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 525397b6df1SKris Buschelman } else { 52616ebf90aSShri Abhyankar nz = 0; val = *v; 52716ebf90aSShri Abhyankar for (i=0; i <M; i++) { 52816ebf90aSShri Abhyankar rnz = 
ai[i+1] - adiag[i]; 52967877ebaSShri Abhyankar ajj = aj + adiag[i]; 53067877ebaSShri Abhyankar v1 = av + adiag[i]; 53167877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 53267877ebaSShri Abhyankar val[nz++] = v1[j]; 53316ebf90aSShri Abhyankar } 53416ebf90aSShri Abhyankar } 53516ebf90aSShri Abhyankar } 53616ebf90aSShri Abhyankar PetscFunctionReturn(0); 53716ebf90aSShri Abhyankar } 53816ebf90aSShri Abhyankar 53916ebf90aSShri Abhyankar #undef __FUNCT__ 54016ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 541bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 54216ebf90aSShri Abhyankar { 54316ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 54416ebf90aSShri Abhyankar PetscErrorCode ierr; 54516ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 54616ebf90aSShri Abhyankar PetscInt *row,*col; 54716ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 54816ebf90aSShri Abhyankar PetscScalar *val; 549397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 550397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 551397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 55216ebf90aSShri Abhyankar 55316ebf90aSShri Abhyankar PetscFunctionBegin; 554d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 555397b6df1SKris Buschelman av=aa->a; bv=bb->a; 556397b6df1SKris Buschelman 5572205254eSKarl Rupp garray = mat->garray; 5582205254eSKarl Rupp 559bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 56016ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 56116ebf90aSShri Abhyankar *nnz = nz; 562185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 563185f6596SHong Zhang col = row + nz; 564185f6596SHong Zhang val = (PetscScalar*)(col + nz); 565185f6596SHong Zhang 
566397b6df1SKris Buschelman *r = row; *c = col; *v = val; 567397b6df1SKris Buschelman } else { 568397b6df1SKris Buschelman row = *r; col = *c; val = *v; 569397b6df1SKris Buschelman } 570397b6df1SKris Buschelman 571028e57e8SHong Zhang jj = 0; irow = rstart; 572397b6df1SKris Buschelman for (i=0; i<m; i++) { 573397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 574397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 575397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 576397b6df1SKris Buschelman bjj = bj + bi[i]; 57716ebf90aSShri Abhyankar v1 = av + ai[i]; 57816ebf90aSShri Abhyankar v2 = bv + bi[i]; 579397b6df1SKris Buschelman 580397b6df1SKris Buschelman /* A-part */ 581397b6df1SKris Buschelman for (j=0; j<countA; j++) { 582bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 583397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 584397b6df1SKris Buschelman } 58516ebf90aSShri Abhyankar val[jj++] = v1[j]; 586397b6df1SKris Buschelman } 58716ebf90aSShri Abhyankar 58816ebf90aSShri Abhyankar /* B-part */ 58916ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 590bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 591397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 592397b6df1SKris Buschelman } 59316ebf90aSShri Abhyankar val[jj++] = v2[j]; 59416ebf90aSShri Abhyankar } 59516ebf90aSShri Abhyankar irow++; 59616ebf90aSShri Abhyankar } 59716ebf90aSShri Abhyankar PetscFunctionReturn(0); 59816ebf90aSShri Abhyankar } 59916ebf90aSShri Abhyankar 60016ebf90aSShri Abhyankar #undef __FUNCT__ 60116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 602bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 60316ebf90aSShri Abhyankar { 60416ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 60516ebf90aSShri Abhyankar PetscErrorCode 
ierr; 60616ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 60716ebf90aSShri Abhyankar PetscInt *row,*col; 60816ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 60916ebf90aSShri Abhyankar PetscScalar *val; 61016ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 61116ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 61216ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 61316ebf90aSShri Abhyankar 61416ebf90aSShri Abhyankar PetscFunctionBegin; 61516ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 61616ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 61716ebf90aSShri Abhyankar 6182205254eSKarl Rupp garray = mat->garray; 6192205254eSKarl Rupp 620bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 62116ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 62216ebf90aSShri Abhyankar *nnz = nz; 623185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 624185f6596SHong Zhang col = row + nz; 625185f6596SHong Zhang val = (PetscScalar*)(col + nz); 626185f6596SHong Zhang 62716ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 62816ebf90aSShri Abhyankar } else { 62916ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 63016ebf90aSShri Abhyankar } 63116ebf90aSShri Abhyankar 63216ebf90aSShri Abhyankar jj = 0; irow = rstart; 63316ebf90aSShri Abhyankar for (i=0; i<m; i++) { 63416ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 63516ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 63616ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 63716ebf90aSShri Abhyankar bjj = bj + bi[i]; 63816ebf90aSShri Abhyankar v1 = av + ai[i]; 63916ebf90aSShri Abhyankar v2 = bv + bi[i]; 64016ebf90aSShri Abhyankar 64116ebf90aSShri Abhyankar /* A-part */ 64216ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 643bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 64416ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] 
= rstart + ajj[j] + shift; 64516ebf90aSShri Abhyankar } 64616ebf90aSShri Abhyankar val[jj++] = v1[j]; 64716ebf90aSShri Abhyankar } 64816ebf90aSShri Abhyankar 64916ebf90aSShri Abhyankar /* B-part */ 65016ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 651bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 65216ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 65316ebf90aSShri Abhyankar } 65416ebf90aSShri Abhyankar val[jj++] = v2[j]; 65516ebf90aSShri Abhyankar } 65616ebf90aSShri Abhyankar irow++; 65716ebf90aSShri Abhyankar } 65816ebf90aSShri Abhyankar PetscFunctionReturn(0); 65916ebf90aSShri Abhyankar } 66016ebf90aSShri Abhyankar 66116ebf90aSShri Abhyankar #undef __FUNCT__ 66267877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij" 663bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 66467877ebaSShri Abhyankar { 66567877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 66667877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 66767877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 66867877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 669d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 67033d57670SJed Brown const PetscInt bs2=mat->bs2; 67167877ebaSShri Abhyankar PetscErrorCode ierr; 67233d57670SJed Brown PetscInt bs,nz,i,j,k,n,jj,irow,countA,countB,idx; 67367877ebaSShri Abhyankar PetscInt *row,*col; 67467877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 67567877ebaSShri Abhyankar PetscScalar *val; 67667877ebaSShri Abhyankar 67767877ebaSShri Abhyankar PetscFunctionBegin; 67833d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 679bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 68067877ebaSShri Abhyankar nz = bs2*(aa->nz + 
bb->nz); 68167877ebaSShri Abhyankar *nnz = nz; 682185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 683185f6596SHong Zhang col = row + nz; 684185f6596SHong Zhang val = (PetscScalar*)(col + nz); 685185f6596SHong Zhang 68667877ebaSShri Abhyankar *r = row; *c = col; *v = val; 68767877ebaSShri Abhyankar } else { 68867877ebaSShri Abhyankar row = *r; col = *c; val = *v; 68967877ebaSShri Abhyankar } 69067877ebaSShri Abhyankar 691d985c460SShri Abhyankar jj = 0; irow = rstart; 69267877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 69367877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 69467877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 69567877ebaSShri Abhyankar ajj = aj + ai[i]; 69667877ebaSShri Abhyankar bjj = bj + bi[i]; 69767877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 69867877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 69967877ebaSShri Abhyankar 70067877ebaSShri Abhyankar idx = 0; 70167877ebaSShri Abhyankar /* A-part */ 70267877ebaSShri Abhyankar for (k=0; k<countA; k++) { 70367877ebaSShri Abhyankar for (j=0; j<bs; j++) { 70467877ebaSShri Abhyankar for (n=0; n<bs; n++) { 705bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 706d985c460SShri Abhyankar row[jj] = irow + n + shift; 707d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 70867877ebaSShri Abhyankar } 70967877ebaSShri Abhyankar val[jj++] = v1[idx++]; 71067877ebaSShri Abhyankar } 71167877ebaSShri Abhyankar } 71267877ebaSShri Abhyankar } 71367877ebaSShri Abhyankar 71467877ebaSShri Abhyankar idx = 0; 71567877ebaSShri Abhyankar /* B-part */ 71667877ebaSShri Abhyankar for (k=0; k<countB; k++) { 71767877ebaSShri Abhyankar for (j=0; j<bs; j++) { 71867877ebaSShri Abhyankar for (n=0; n<bs; n++) { 719bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 720d985c460SShri Abhyankar row[jj] = irow + n + shift; 721d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 72267877ebaSShri Abhyankar } 723d985c460SShri Abhyankar val[jj++] = 
v2[idx++]; 72467877ebaSShri Abhyankar } 72567877ebaSShri Abhyankar } 72667877ebaSShri Abhyankar } 727d985c460SShri Abhyankar irow += bs; 72867877ebaSShri Abhyankar } 72967877ebaSShri Abhyankar PetscFunctionReturn(0); 73067877ebaSShri Abhyankar } 73167877ebaSShri Abhyankar 73267877ebaSShri Abhyankar #undef __FUNCT__ 73316ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 734bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 73516ebf90aSShri Abhyankar { 73616ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 73716ebf90aSShri Abhyankar PetscErrorCode ierr; 738e0bace9bSHong Zhang PetscInt rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 73916ebf90aSShri Abhyankar PetscInt *row,*col; 74016ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 74116ebf90aSShri Abhyankar PetscScalar *val; 74216ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 74316ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 74416ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 74516ebf90aSShri Abhyankar 74616ebf90aSShri Abhyankar PetscFunctionBegin; 74716ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 74816ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 74916ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 7502205254eSKarl Rupp 75116ebf90aSShri Abhyankar rstart = A->rmap->rstart; 75216ebf90aSShri Abhyankar 753bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 754e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 755e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 75616ebf90aSShri Abhyankar for (i=0; i<m; i++) { 757e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 75816ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 75916ebf90aSShri Abhyankar bjj = bj + bi[i]; 760e0bace9bSHong Zhang for 
(j=0; j<countB; j++) { 761e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 762e0bace9bSHong Zhang } 763e0bace9bSHong Zhang } 76416ebf90aSShri Abhyankar 765e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 76616ebf90aSShri Abhyankar *nnz = nz; 767185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 768185f6596SHong Zhang col = row + nz; 769185f6596SHong Zhang val = (PetscScalar*)(col + nz); 770185f6596SHong Zhang 77116ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 77216ebf90aSShri Abhyankar } else { 77316ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 77416ebf90aSShri Abhyankar } 77516ebf90aSShri Abhyankar 77616ebf90aSShri Abhyankar jj = 0; irow = rstart; 77716ebf90aSShri Abhyankar for (i=0; i<m; i++) { 77816ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 77916ebf90aSShri Abhyankar v1 = av + adiag[i]; 78016ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 78116ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 78216ebf90aSShri Abhyankar bjj = bj + bi[i]; 78316ebf90aSShri Abhyankar v2 = bv + bi[i]; 78416ebf90aSShri Abhyankar 78516ebf90aSShri Abhyankar /* A-part */ 78616ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 787bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 78816ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 78916ebf90aSShri Abhyankar } 79016ebf90aSShri Abhyankar val[jj++] = v1[j]; 79116ebf90aSShri Abhyankar } 79216ebf90aSShri Abhyankar 79316ebf90aSShri Abhyankar /* B-part */ 79416ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 79516ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 796bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 79716ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 79816ebf90aSShri Abhyankar } 79916ebf90aSShri Abhyankar val[jj++] = v2[j]; 80016ebf90aSShri Abhyankar } 801397b6df1SKris Buschelman } 
802397b6df1SKris Buschelman irow++; 803397b6df1SKris Buschelman } 804397b6df1SKris Buschelman PetscFunctionReturn(0); 805397b6df1SKris Buschelman } 806397b6df1SKris Buschelman 807397b6df1SKris Buschelman #undef __FUNCT__ 8083924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 809dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A) 810dfbe8321SBarry Smith { 811*e69c285eSBarry Smith Mat_MUMPS *mumps=(Mat_MUMPS*)A->data; 812dfbe8321SBarry Smith PetscErrorCode ierr; 813b24902e0SBarry Smith 814397b6df1SKris Buschelman PetscFunctionBegin; 815a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 816a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 817a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 818801fbe65SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 819a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 820a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 821a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 822b34f08ffSHong Zhang ierr = PetscFree(mumps->info);CHKERRQ(ierr); 82359ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 824a5e57a09SHong Zhang mumps->id.job = JOB_END; 825a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 8266f3cc6f9SBarry Smith ierr = MPI_Comm_free(&mumps->comm_mumps);CHKERRQ(ierr); 827*e69c285eSBarry Smith ierr = PetscFree(A->data);CHKERRQ(ierr); 828bf0cc555SLisandro Dalcin 82997969023SHong Zhang /* clear composed functions */ 830bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 8315a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorSetSchurIS_C",NULL);CHKERRQ(ierr); 8325a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorInvertSchurComplement_C",NULL);CHKERRQ(ierr); 8335a05ddb0SStefano Zampini ierr = 
PetscObjectComposeFunction((PetscObject)A,"MatFactorCreateSchurComplement_C",NULL);CHKERRQ(ierr); 8345a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSchurComplement_C",NULL);CHKERRQ(ierr); 8355a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorSolveSchurComplement_C",NULL);CHKERRQ(ierr); 8365a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorSolveSchurComplementTranspose_C",NULL);CHKERRQ(ierr); 837bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 838bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetIcntl_C",NULL);CHKERRQ(ierr); 839bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 840bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetCntl_C",NULL);CHKERRQ(ierr); 841ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfo_C",NULL);CHKERRQ(ierr); 842ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfog_C",NULL);CHKERRQ(ierr); 843ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfo_C",NULL);CHKERRQ(ierr); 844ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfog_C",NULL);CHKERRQ(ierr); 845397b6df1SKris Buschelman PetscFunctionReturn(0); 846397b6df1SKris Buschelman } 847397b6df1SKris Buschelman 848397b6df1SKris Buschelman #undef __FUNCT__ 849f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 850b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 851b24902e0SBarry Smith { 852*e69c285eSBarry Smith Mat_MUMPS *mumps=(Mat_MUMPS*)A->data; 853d54de34fSKris Buschelman PetscScalar *array; 85467877ebaSShri Abhyankar Vec b_seq; 855329ec9b3SHong Zhang IS is_iden,is_petsc; 856dfbe8321SBarry Smith PetscErrorCode ierr; 857329ec9b3SHong Zhang PetscInt i; 
858cc86f929SStefano Zampini PetscBool second_solve = PETSC_FALSE; 859883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 860397b6df1SKris Buschelman 861397b6df1SKris Buschelman PetscFunctionBegin; 862883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 863883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 8642aca8efcSHong Zhang 865d8cd2189SHong Zhang if (A->errortype) { 8662aca8efcSHong Zhang ierr = PetscInfo2(A,"MatSolve is called with singular matrix factor, INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 8672aca8efcSHong Zhang ierr = VecSetInf(x);CHKERRQ(ierr); 8682aca8efcSHong Zhang PetscFunctionReturn(0); 8692aca8efcSHong Zhang } 8702aca8efcSHong Zhang 871a5e57a09SHong Zhang mumps->id.nrhs = 1; 872a5e57a09SHong Zhang b_seq = mumps->b_seq; 873a5e57a09SHong Zhang if (mumps->size > 1) { 874329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. 
Scatter b into a seqential rhs vector */ 875a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 876a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 877a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 878397b6df1SKris Buschelman } else { /* size == 1 */ 879397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 880397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 881397b6df1SKris Buschelman } 882a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 883a5e57a09SHong Zhang mumps->id.nrhs = 1; 884940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 885397b6df1SKris Buschelman } 886397b6df1SKris Buschelman 887cc86f929SStefano Zampini /* 888cc86f929SStefano Zampini handle condensation step of Schur complement (if any) 889cc86f929SStefano Zampini We set by default ICNTL(26) == -1 when Schur indices have been provided by the user. 890cc86f929SStefano Zampini According to MUMPS (5.0.0) manual, any value should be harmful during the factorization phase 891cc86f929SStefano Zampini Unless the user provides a valid value for ICNTL(26), MatSolve and MatMatSolve routines solve the full system. 
892cc86f929SStefano Zampini This requires an extra call to PetscMUMPS_c and the computation of the factors for S 893cc86f929SStefano Zampini */ 894cc86f929SStefano Zampini if (mumps->id.ICNTL(26) < 0 || mumps->id.ICNTL(26) > 2) { 895cc86f929SStefano Zampini second_solve = PETSC_TRUE; 896b8f61ee1SStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 897cc86f929SStefano Zampini } 898397b6df1SKris Buschelman /* solve phase */ 899329ec9b3SHong Zhang /*-------------*/ 900a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 901a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 902a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 903397b6df1SKris Buschelman 904b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 905cc86f929SStefano Zampini if (second_solve) { 906b8f61ee1SStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 907cc86f929SStefano Zampini } 908b5fa320bSStefano Zampini 909a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 910a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 911a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 912a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 913397b6df1SKris Buschelman } 914a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 915a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 916a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 917a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 918a5e57a09SHong Zhang } 919a5e57a09SHong Zhang ierr = 
ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 920a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 9216bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9226bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 9232205254eSKarl Rupp 924a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 925397b6df1SKris Buschelman } 926a5e57a09SHong Zhang 927a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 928a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 929329ec9b3SHong Zhang } 930397b6df1SKris Buschelman PetscFunctionReturn(0); 931397b6df1SKris Buschelman } 932397b6df1SKris Buschelman 93351d5961aSHong Zhang #undef __FUNCT__ 93451d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 93551d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 93651d5961aSHong Zhang { 937*e69c285eSBarry Smith Mat_MUMPS *mumps=(Mat_MUMPS*)A->data; 93851d5961aSHong Zhang PetscErrorCode ierr; 93951d5961aSHong Zhang 94051d5961aSHong Zhang PetscFunctionBegin; 941a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 9420ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 943a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 94451d5961aSHong Zhang PetscFunctionReturn(0); 94551d5961aSHong Zhang } 94651d5961aSHong Zhang 947e0b74bf9SHong Zhang #undef __FUNCT__ 948e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 949e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 950e0b74bf9SHong Zhang { 951bda8bf91SBarry Smith PetscErrorCode ierr; 952bda8bf91SBarry Smith PetscBool flg; 953*e69c285eSBarry Smith Mat_MUMPS *mumps=(Mat_MUMPS*)A->data; 954334c5f61SHong Zhang PetscInt i,nrhs,M; 9552cd7d884SHong Zhang PetscScalar 
*array,*bray; 956bda8bf91SBarry Smith 957e0b74bf9SHong Zhang PetscFunctionBegin; 9580298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 959801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 9600298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 961801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 962801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 9634e34a73bSHong Zhang 9642cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 965334c5f61SHong Zhang mumps->id.nrhs = nrhs; 966334c5f61SHong Zhang mumps->id.lrhs = M; 9674e34a73bSHong Zhang 9682cd7d884SHong Zhang if (mumps->size == 1) { 9692cd7d884SHong Zhang /* copy B to X */ 9702cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 9712cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 9726444a565SStefano Zampini ierr = PetscMemcpy(array,bray,M*nrhs*sizeof(PetscScalar));CHKERRQ(ierr); 9732cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 974940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 975b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 976b8f61ee1SStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 977801fbe65SHong Zhang 9782cd7d884SHong Zhang /* solve phase */ 9792cd7d884SHong Zhang /*-------------*/ 9802cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 9812cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 9822cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 983b5fa320bSStefano 
Zampini 984b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 985b8f61ee1SStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 9862cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 987334c5f61SHong Zhang } else { /*--------- parallel case --------*/ 98871aed81dSHong Zhang PetscInt lsol_loc,nlsol_loc,*isol_loc,*idx,*iidx,*idxx,*isol_loc_save; 9891070efccSSatish Balay MumpsScalar *sol_loc,*sol_loc_save; 990801fbe65SHong Zhang IS is_to,is_from; 991334c5f61SHong Zhang PetscInt k,proc,j,m; 992801fbe65SHong Zhang const PetscInt *rstart; 993334c5f61SHong Zhang Vec v_mpi,b_seq,x_seq; 994334c5f61SHong Zhang VecScatter scat_rhs,scat_sol; 995801fbe65SHong Zhang 996801fbe65SHong Zhang /* create x_seq to hold local solution */ 99771aed81dSHong Zhang isol_loc_save = mumps->id.isol_loc; /* save it for MatSovle() */ 99871aed81dSHong Zhang sol_loc_save = mumps->id.sol_loc; 999801fbe65SHong Zhang 100071aed81dSHong Zhang lsol_loc = mumps->id.INFO(23); 100171aed81dSHong Zhang nlsol_loc = nrhs*lsol_loc; /* length of sol_loc */ 100271aed81dSHong Zhang ierr = PetscMalloc2(nlsol_loc,&sol_loc,nlsol_loc,&isol_loc);CHKERRQ(ierr); 1003940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1004801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 1005801fbe65SHong Zhang 10061070efccSSatish Balay ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,nlsol_loc,(PetscScalar*)sol_loc,&x_seq);CHKERRQ(ierr); 10072cd7d884SHong Zhang 100874f0fcc7SHong Zhang /* copy rhs matrix B into vector v_mpi */ 1009334c5f61SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 1010801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 101174f0fcc7SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&v_mpi);CHKERRQ(ierr); 1012801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 1013801fbe65SHong Zhang 1014334c5f61SHong Zhang /* scatter 
v_mpi to b_seq because MUMPS only supports centralized rhs */ 101574f0fcc7SHong Zhang /* idx: maps from k-th index of v_mpi to (i,j)-th global entry of B; 1016801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 1017801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 1018801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 1019801fbe65SHong Zhang k = 0; 1020801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 1021801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 1022801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 1023801fbe65SHong Zhang iidx[j*M + i] = k; 1024801fbe65SHong Zhang idx[k++] = j*M + i; 1025801fbe65SHong Zhang } 1026801fbe65SHong Zhang } 10272cd7d884SHong Zhang } 10282cd7d884SHong Zhang 1029801fbe65SHong Zhang if (!mumps->myid) { 1030334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&b_seq);CHKERRQ(ierr); 1031801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1032801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 1033801fbe65SHong Zhang } else { 1034334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&b_seq);CHKERRQ(ierr); 1035801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 1036801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 1037801fbe65SHong Zhang } 1038334c5f61SHong Zhang ierr = VecScatterCreate(v_mpi,is_from,b_seq,is_to,&scat_rhs);CHKERRQ(ierr); 1039334c5f61SHong Zhang ierr = VecScatterBegin(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1040801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1041801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1042334c5f61SHong Zhang ierr = VecScatterEnd(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1043801fbe65SHong Zhang 1044801fbe65SHong Zhang if 
(!mumps->myid) { /* define rhs on the host */ 1045334c5f61SHong Zhang ierr = VecGetArray(b_seq,&bray);CHKERRQ(ierr); 1046940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)bray; 1047334c5f61SHong Zhang ierr = VecRestoreArray(b_seq,&bray);CHKERRQ(ierr); 1048801fbe65SHong Zhang } 1049801fbe65SHong Zhang 1050801fbe65SHong Zhang /* solve phase */ 1051801fbe65SHong Zhang /*-------------*/ 1052801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 1053801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 1054801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 1055801fbe65SHong Zhang 1056334c5f61SHong Zhang /* scatter mumps distributed solution to petsc vector v_mpi, which shares local arrays with solution matrix X */ 105774f0fcc7SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 105874f0fcc7SHong Zhang ierr = VecPlaceArray(v_mpi,array);CHKERRQ(ierr); 1059801fbe65SHong Zhang 1060334c5f61SHong Zhang /* create scatter scat_sol */ 106171aed81dSHong Zhang ierr = PetscMalloc1(nlsol_loc,&idxx);CHKERRQ(ierr); 106271aed81dSHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nlsol_loc,0,1,&is_from);CHKERRQ(ierr); 106371aed81dSHong Zhang for (i=0; i<lsol_loc; i++) { 1064334c5f61SHong Zhang isol_loc[i] -= 1; /* change Fortran style to C style */ 1065334c5f61SHong Zhang idxx[i] = iidx[isol_loc[i]]; 1066801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 1067334c5f61SHong Zhang idxx[j*lsol_loc+i] = iidx[isol_loc[i]+j*M]; 1068801fbe65SHong Zhang } 1069801fbe65SHong Zhang } 107071aed81dSHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nlsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1071334c5f61SHong Zhang ierr = VecScatterCreate(x_seq,is_from,v_mpi,is_to,&scat_sol);CHKERRQ(ierr); 1072334c5f61SHong Zhang ierr = VecScatterBegin(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1073801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1074801fbe65SHong Zhang 
ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1075334c5f61SHong Zhang ierr = VecScatterEnd(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1076801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 107771aed81dSHong Zhang 107871aed81dSHong Zhang /* free spaces */ 107971aed81dSHong Zhang mumps->id.sol_loc = sol_loc_save; 108071aed81dSHong Zhang mumps->id.isol_loc = isol_loc_save; 108171aed81dSHong Zhang 108271aed81dSHong Zhang ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 1083801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 1084801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 108571aed81dSHong Zhang ierr = VecDestroy(&x_seq);CHKERRQ(ierr); 108674f0fcc7SHong Zhang ierr = VecDestroy(&v_mpi);CHKERRQ(ierr); 1087334c5f61SHong Zhang ierr = VecDestroy(&b_seq);CHKERRQ(ierr); 1088334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_rhs);CHKERRQ(ierr); 1089334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_sol);CHKERRQ(ierr); 1090801fbe65SHong Zhang } 1091e0b74bf9SHong Zhang PetscFunctionReturn(0); 1092e0b74bf9SHong Zhang } 1093e0b74bf9SHong Zhang 1094ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 1095a58c3f20SHong Zhang /* 1096a58c3f20SHong Zhang input: 1097a58c3f20SHong Zhang F: numeric factor 1098a58c3f20SHong Zhang output: 1099a58c3f20SHong Zhang nneg: total number of negative pivots 110019d49a3bSHong Zhang nzero: total number of zero pivots 110119d49a3bSHong Zhang npos: (global dimension of F) - nneg - nzero 1102a58c3f20SHong Zhang */ 1103a58c3f20SHong Zhang #undef __FUNCT__ 1104a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 1105dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 1106a58c3f20SHong Zhang { 1107*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 1108dfbe8321SBarry Smith PetscErrorCode ierr; 1109c1490034SHong Zhang PetscMPIInt size; 1110a58c3f20SHong Zhang 1111a58c3f20SHong Zhang PetscFunctionBegin; 1112ce94432eSBarry Smith 
ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 1113bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 1114a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 1115ed85ac9fSHong Zhang 1116710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 1117ed85ac9fSHong Zhang if (nzero || npos) { 1118ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 1119710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 1120710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 1121a58c3f20SHong Zhang } 1122a58c3f20SHong Zhang PetscFunctionReturn(0); 1123a58c3f20SHong Zhang } 112419d49a3bSHong Zhang #endif 1125a58c3f20SHong Zhang 1126397b6df1SKris Buschelman #undef __FUNCT__ 1127f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 11289a625307SHong Zhang PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 1129af281ebdSHong Zhang { 1130*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->data; 11316849ba73SBarry Smith PetscErrorCode ierr; 1132ace3abfcSBarry Smith PetscBool isMPIAIJ; 1133397b6df1SKris Buschelman 1134397b6df1SKris Buschelman PetscFunctionBegin; 11356baea169SHong Zhang if (mumps->id.INFOG(1) < 0) { 11362aca8efcSHong Zhang if (mumps->id.INFOG(1) == -6) { 11372aca8efcSHong Zhang ierr = PetscInfo2(A,"MatFactorNumeric is called with singular matrix structure, INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 11386baea169SHong Zhang } 11396baea169SHong Zhang ierr = PetscInfo2(A,"MatFactorNumeric is called after analysis 
phase fails, INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 11402aca8efcSHong Zhang PetscFunctionReturn(0); 11412aca8efcSHong Zhang } 11426baea169SHong Zhang 1143a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1144397b6df1SKris Buschelman 1145397b6df1SKris Buschelman /* numerical factorization phase */ 1146329ec9b3SHong Zhang /*-------------------------------*/ 1147a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 11484e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 1149a5e57a09SHong Zhang if (!mumps->myid) { 1150940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 1151397b6df1SKris Buschelman } 1152397b6df1SKris Buschelman } else { 1153940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 1154397b6df1SKris Buschelman } 1155a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1156a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 1157c0d63f2fSHong Zhang if (A->erroriffailure) { 1158c0d63f2fSHong Zhang SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2)); 1159c0d63f2fSHong Zhang } else { 1160c0d63f2fSHong Zhang if (mumps->id.INFOG(1) == -10) { /* numerically singular matrix */ 11612aca8efcSHong Zhang ierr = PetscInfo2(F,"matrix is numerically singular, INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 1162680c5173SHong Zhang F->errortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 1163c0d63f2fSHong Zhang } else if (mumps->id.INFOG(1) == -13) { 1164c0d63f2fSHong Zhang ierr = PetscInfo2(F,"MUMPS in numerical factorization phase: INFOG(1)=%d, cannot allocate required memory %d megabytes\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 1165680c5173SHong Zhang F->errortype = MAT_FACTOR_OUTMEMORY; 1166c0d63f2fSHong Zhang } else if (mumps->id.INFOG(1) == -8 || 
mumps->id.INFOG(1) == -9 || (-16 < mumps->id.INFOG(1) && mumps->id.INFOG(1) < -10) ) { 1167c0d63f2fSHong Zhang ierr = PetscInfo2(F,"MUMPS in numerical factorization phase: INFOG(1)=%d, INFO(2)=%d, problem with workarray \n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 1168680c5173SHong Zhang F->errortype = MAT_FACTOR_OUTMEMORY; 11692aca8efcSHong Zhang } else { 1170c0d63f2fSHong Zhang ierr = PetscInfo2(F,"MUMPS in numerical factorization phase: INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 1171680c5173SHong Zhang F->errortype = MAT_FACTOR_OTHER; 11722aca8efcSHong Zhang } 11732aca8efcSHong Zhang } 1174397b6df1SKris Buschelman } 1175a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 1176397b6df1SKris Buschelman 1177dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 1178a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 1179b5fa320bSStefano Zampini mumps->schur_factored = PETSC_FALSE; 118059ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 118167877ebaSShri Abhyankar 1182066565c5SStefano Zampini /* just to be sure that ICNTL(19) value returned by a call from MatMumpsGetIcntl is always consistent */ 1183066565c5SStefano Zampini if (!mumps->sym && mumps->id.ICNTL(19) && mumps->id.ICNTL(19) != 1) mumps->id.ICNTL(19) = 3; 1184066565c5SStefano Zampini 1185a5e57a09SHong Zhang if (mumps->size > 1) { 118667877ebaSShri Abhyankar PetscInt lsol_loc; 118767877ebaSShri Abhyankar PetscScalar *sol_loc; 11882205254eSKarl Rupp 1189c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 1190c2093ab7SHong Zhang 1191c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 1192c2093ab7SHong Zhang if (mumps->x_seq) { 1193c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 1194c2093ab7SHong Zhang ierr = 
PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 1195c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 1196c2093ab7SHong Zhang } 1197a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 1198dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 1199a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 1200940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1201a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 120267877ebaSShri Abhyankar } 1203397b6df1SKris Buschelman PetscFunctionReturn(0); 1204397b6df1SKris Buschelman } 1205397b6df1SKris Buschelman 12069a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 1207dcd589f8SShri Abhyankar #undef __FUNCT__ 12089a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 12099a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 1210dcd589f8SShri Abhyankar { 1211*e69c285eSBarry Smith Mat_MUMPS *mumps = (Mat_MUMPS*)F->data; 1212dcd589f8SShri Abhyankar PetscErrorCode ierr; 1213b34f08ffSHong Zhang PetscInt icntl,info[40],i,ninfo=40; 1214ace3abfcSBarry Smith PetscBool flg; 1215dcd589f8SShri Abhyankar 1216dcd589f8SShri Abhyankar PetscFunctionBegin; 1217ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 12189a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 12199a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 12209a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 12219a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 12229a2535b5SHong Zhang ierr = 
PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 12239a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 1224dcd589f8SShri Abhyankar 12259a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 12269a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 12279a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 12289a2535b5SHong Zhang 1229d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 12309a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 12319a2535b5SHong Zhang 1232d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 
3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 1233dcd589f8SShri Abhyankar if (flg) { 12342205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 12352205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 1236dcd589f8SShri Abhyankar } 1237e0b74bf9SHong Zhang 12380298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 1239d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 12400298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 1241d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 1242d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 1243d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 1244d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 1245d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur 
complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 124659ac8732SStefano Zampini if (mumps->id.ICNTL(19) <= 0 || mumps->id.ICNTL(19) > 3) { /* reset any schur data (if any) */ 124759ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 124859ac8732SStefano Zampini } 12494e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 1250d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 12519a2535b5SHong Zhang 1252d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 12530298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 12540298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 12559a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 12569a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 1257d7ebd59bSHong Zhang } 1258d7ebd59bSHong Zhang 1259d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 1260d341cd04SHong Zhang ierr = 
PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 12612cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 12620298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 1263d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 12640298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 1265d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 12664e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 12670298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1268dcd589f8SShri Abhyankar 12690298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 12700298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of 
refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 12710298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 12720298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 12730298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1274e5bb22a1SHong Zhang 12750298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1276b34f08ffSHong Zhang 127716d797efSHong Zhang ierr = PetscOptionsIntArray("-mat_mumps_view_info","request INFO local to each processor","",info,&ninfo,NULL);CHKERRQ(ierr); 1278b34f08ffSHong Zhang if (ninfo) { 1279b34f08ffSHong Zhang if (ninfo > 40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"number of INFO %d must <= 40\n",ninfo); 1280b34f08ffSHong Zhang ierr = PetscMalloc1(ninfo,&mumps->info);CHKERRQ(ierr); 1281b34f08ffSHong Zhang mumps->ninfo = ninfo; 1282b34f08ffSHong Zhang for (i=0; i<ninfo; i++) { 12836c4ed002SBarry Smith if (info[i] < 0 || info[i]>40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"index of INFO %d must between 1 and 40\n",ninfo); 12846c4ed002SBarry Smith else { 1285b34f08ffSHong Zhang mumps->info[i] = info[i]; 1286b34f08ffSHong Zhang } 1287b34f08ffSHong Zhang } 1288b34f08ffSHong Zhang } 1289b34f08ffSHong Zhang 1290dcd589f8SShri Abhyankar PetscOptionsEnd(); 1291dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1292dcd589f8SShri Abhyankar } 1293dcd589f8SShri Abhyankar 1294dcd589f8SShri Abhyankar #undef __FUNCT__ 1295dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1296f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1297dcd589f8SShri 
Abhyankar { 1298dcd589f8SShri Abhyankar PetscErrorCode ierr; 1299dcd589f8SShri Abhyankar 1300dcd589f8SShri Abhyankar PetscFunctionBegin; 1301ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1302ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1303ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 13042205254eSKarl Rupp 1305f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1306f697e70eSHong Zhang 1307f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1308f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1309f697e70eSHong Zhang mumps->id.sym = mumps->sym; 13102907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1311f697e70eSHong Zhang 13120298fd71SBarry Smith mumps->scat_rhs = NULL; 13130298fd71SBarry Smith mumps->scat_sol = NULL; 13149a2535b5SHong Zhang 131570544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 13169a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 13179a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 13189a2535b5SHong Zhang if (mumps->size == 1) { 13199a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 13209a2535b5SHong Zhang } else { 13219a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 13224e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 132370544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 13249a2535b5SHong Zhang } 13256444a565SStefano Zampini 13266444a565SStefano Zampini /* schur */ 13276444a565SStefano Zampini mumps->id.size_schur = 0; 13286444a565SStefano Zampini mumps->id.listvar_schur = NULL; 13296444a565SStefano Zampini mumps->id.schur = NULL; 1330b5fa320bSStefano Zampini mumps->sizeredrhs = 0; 1331b5fa320bSStefano Zampini mumps->schur_pivots = NULL; 1332b5fa320bSStefano Zampini mumps->schur_work = NULL; 
133359ac8732SStefano Zampini mumps->schur_sol = NULL; 133459ac8732SStefano Zampini mumps->schur_sizesol = 0; 133559ac8732SStefano Zampini mumps->schur_factored = PETSC_FALSE; 133659ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 1337dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1338dcd589f8SShri Abhyankar } 1339dcd589f8SShri Abhyankar 13405cd7cf9dSHong Zhang #undef __FUNCT__ 13415cd7cf9dSHong Zhang #define __FUNCT__ "MatFactorSymbolic_MUMPS_ReportIfError" 13429a625307SHong Zhang PetscErrorCode MatFactorSymbolic_MUMPS_ReportIfError(Mat F,Mat A,const MatFactorInfo *info,Mat_MUMPS *mumps) 13435cd7cf9dSHong Zhang { 13445cd7cf9dSHong Zhang PetscErrorCode ierr; 13455cd7cf9dSHong Zhang 13465cd7cf9dSHong Zhang PetscFunctionBegin; 13475cd7cf9dSHong Zhang if (mumps->id.INFOG(1) < 0) { 13485cd7cf9dSHong Zhang if (A->erroriffailure) { 13495cd7cf9dSHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 13505cd7cf9dSHong Zhang } else { 13515cd7cf9dSHong Zhang if (mumps->id.INFOG(1) == -6) { 13525cd7cf9dSHong Zhang ierr = PetscInfo2(F,"matrix is singular in structure, INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 1353680c5173SHong Zhang F->errortype = MAT_FACTOR_STRUCT_ZEROPIVOT; 13545cd7cf9dSHong Zhang } else if (mumps->id.INFOG(1) == -5 || mumps->id.INFOG(1) == -7) { 13555cd7cf9dSHong Zhang ierr = PetscInfo2(F,"problem of workspace, INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 1356680c5173SHong Zhang F->errortype = MAT_FACTOR_OUTMEMORY; 13575cd7cf9dSHong Zhang } else { 13585cd7cf9dSHong Zhang ierr = PetscInfo2(F,"Error reported by MUMPS in analysis phase: INFOG(1)=%d, INFO(2)=%d\n",mumps->id.INFOG(1),mumps->id.INFO(2));CHKERRQ(ierr); 1359680c5173SHong Zhang F->errortype = MAT_FACTOR_OTHER; 13605cd7cf9dSHong Zhang } 13615cd7cf9dSHong Zhang } 13625cd7cf9dSHong Zhang } 13635cd7cf9dSHong Zhang PetscFunctionReturn(0); 
13645cd7cf9dSHong Zhang } 13655cd7cf9dSHong Zhang 1366a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1367397b6df1SKris Buschelman #undef __FUNCT__ 1368f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 13699a625307SHong Zhang PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1370b24902e0SBarry Smith { 1371*e69c285eSBarry Smith Mat_MUMPS *mumps = (Mat_MUMPS*)F->data; 1372dcd589f8SShri Abhyankar PetscErrorCode ierr; 137367877ebaSShri Abhyankar Vec b; 137467877ebaSShri Abhyankar IS is_iden; 137567877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1376397b6df1SKris Buschelman 1377397b6df1SKris Buschelman PetscFunctionBegin; 1378a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1379dcd589f8SShri Abhyankar 13809a2535b5SHong Zhang /* Set MUMPS options from the options database */ 13819a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1382dcd589f8SShri Abhyankar 1383a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1384dcd589f8SShri Abhyankar 138567877ebaSShri Abhyankar /* analysis phase */ 138667877ebaSShri Abhyankar /*----------------*/ 1387a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1388a5e57a09SHong Zhang mumps->id.n = M; 1389a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 139067877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1391a5e57a09SHong Zhang if (!mumps->myid) { 1392a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1393a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1394940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 139567877ebaSShri Abhyankar } 1396a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c 
ordering */ 13975248a706SHong Zhang /* 13985248a706SHong Zhang PetscBool flag; 13995248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 14005248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 14015248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 14025248a706SHong Zhang */ 1403a5e57a09SHong Zhang if (!mumps->myid) { 1404e0b74bf9SHong Zhang const PetscInt *idx; 1405e0b74bf9SHong Zhang PetscInt i,*perm_in; 14062205254eSKarl Rupp 1407785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1408e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 14092205254eSKarl Rupp 1410a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1411e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */ 1412e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1413e0b74bf9SHong Zhang } 1414e0b74bf9SHong Zhang } 141567877ebaSShri Abhyankar } 141667877ebaSShri Abhyankar break; 141767877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1418a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1419a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1420a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1421940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 142267877ebaSShri Abhyankar } 142367877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. 
Create scatter scat_rhs for repeated use in MatSolve() */ 1424a5e57a09SHong Zhang if (!mumps->myid) { 14252cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 14262cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 142767877ebaSShri Abhyankar } else { 1428a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 142967877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 143067877ebaSShri Abhyankar } 14312a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1432a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14336bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14346bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 143567877ebaSShri Abhyankar break; 143667877ebaSShri Abhyankar } 1437a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 14385cd7cf9dSHong Zhang ierr = MatFactorSymbolic_MUMPS_ReportIfError(F,A,info,mumps);CHKERRQ(ierr); 143967877ebaSShri Abhyankar 1440719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1441dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 144251d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 14434e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1444b24902e0SBarry Smith PetscFunctionReturn(0); 1445b24902e0SBarry Smith } 1446b24902e0SBarry Smith 1447450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1448450b117fSShri Abhyankar #undef __FUNCT__ 1449450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 14509a625307SHong Zhang PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1451450b117fSShri Abhyankar { 1452*e69c285eSBarry Smith Mat_MUMPS *mumps = (Mat_MUMPS*)F->data; 1453dcd589f8SShri Abhyankar PetscErrorCode ierr; 145467877ebaSShri Abhyankar Vec b; 
145567877ebaSShri Abhyankar IS is_iden; 145667877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1457450b117fSShri Abhyankar 1458450b117fSShri Abhyankar PetscFunctionBegin; 1459a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1460dcd589f8SShri Abhyankar 14619a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14629a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1463dcd589f8SShri Abhyankar 1464a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 146567877ebaSShri Abhyankar 146667877ebaSShri Abhyankar /* analysis phase */ 146767877ebaSShri Abhyankar /*----------------*/ 1468a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1469a5e57a09SHong Zhang mumps->id.n = M; 1470a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 147167877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1472a5e57a09SHong Zhang if (!mumps->myid) { 1473a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1474a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1475940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 147667877ebaSShri Abhyankar } 147767877ebaSShri Abhyankar } 147867877ebaSShri Abhyankar break; 147967877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1480a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1481a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1482a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1483940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 148467877ebaSShri Abhyankar } 148567877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. 
Create scatter scat_rhs for repeated use in MatSolve() */ 1486a5e57a09SHong Zhang if (!mumps->myid) { 1487a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 148867877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 148967877ebaSShri Abhyankar } else { 1490a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 149167877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 149267877ebaSShri Abhyankar } 14932a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1494a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14956bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14966bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 149767877ebaSShri Abhyankar break; 149867877ebaSShri Abhyankar } 1499a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 15005cd7cf9dSHong Zhang ierr = MatFactorSymbolic_MUMPS_ReportIfError(F,A,info,mumps);CHKERRQ(ierr); 150167877ebaSShri Abhyankar 1502450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1503dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 150451d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1505450b117fSShri Abhyankar PetscFunctionReturn(0); 1506450b117fSShri Abhyankar } 1507b24902e0SBarry Smith 1508141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1509397b6df1SKris Buschelman #undef __FUNCT__ 151067877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 15119a625307SHong Zhang PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1512b24902e0SBarry Smith { 1513*e69c285eSBarry Smith Mat_MUMPS *mumps = (Mat_MUMPS*)F->data; 1514dcd589f8SShri Abhyankar PetscErrorCode ierr; 151567877ebaSShri Abhyankar Vec b; 151667877ebaSShri Abhyankar IS is_iden; 
151767877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1518397b6df1SKris Buschelman 1519397b6df1SKris Buschelman PetscFunctionBegin; 1520a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1521dcd589f8SShri Abhyankar 15229a2535b5SHong Zhang /* Set MUMPS options from the options database */ 15239a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1524dcd589f8SShri Abhyankar 1525a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1526dcd589f8SShri Abhyankar 152767877ebaSShri Abhyankar /* analysis phase */ 152867877ebaSShri Abhyankar /*----------------*/ 1529a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1530a5e57a09SHong Zhang mumps->id.n = M; 1531a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 153267877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1533a5e57a09SHong Zhang if (!mumps->myid) { 1534a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1535a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1536940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 153767877ebaSShri Abhyankar } 153867877ebaSShri Abhyankar } 153967877ebaSShri Abhyankar break; 154067877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1541a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1542a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1543a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1544940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 154567877ebaSShri Abhyankar } 154667877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. 
Create scatter scat_rhs for repeated use in MatSolve() */ 1547a5e57a09SHong Zhang if (!mumps->myid) { 1548a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 154967877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 155067877ebaSShri Abhyankar } else { 1551a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 155267877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 155367877ebaSShri Abhyankar } 15542a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1555a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 15566bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 15576bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 155867877ebaSShri Abhyankar break; 155967877ebaSShri Abhyankar } 1560a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 15615cd7cf9dSHong Zhang ierr = MatFactorSymbolic_MUMPS_ReportIfError(F,A,info,mumps);CHKERRQ(ierr); 15625cd7cf9dSHong Zhang 15632792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1564dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 156551d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 15664e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 15674e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 15680298fd71SBarry Smith F->ops->getinertia = NULL; 15694e34a73bSHong Zhang #else 15704e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1571db4efbfdSBarry Smith #endif 1572b24902e0SBarry Smith PetscFunctionReturn(0); 1573b24902e0SBarry Smith } 1574b24902e0SBarry Smith 1575397b6df1SKris Buschelman #undef __FUNCT__ 157664e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 157764e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 157874ed9c26SBarry Smith { 1579f6c57405SHong Zhang PetscErrorCode ierr; 
158064e6c443SBarry Smith PetscBool iascii; 158164e6c443SBarry Smith PetscViewerFormat format; 1582*e69c285eSBarry Smith Mat_MUMPS *mumps=(Mat_MUMPS*)A->data; 1583f6c57405SHong Zhang 1584f6c57405SHong Zhang PetscFunctionBegin; 158564e6c443SBarry Smith /* check if matrix is mumps type */ 158664e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 158764e6c443SBarry Smith 1588251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 158964e6c443SBarry Smith if (iascii) { 159064e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 159164e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 159264e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1593a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1594a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1595a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1596a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1597a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1598a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1599a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1600a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1601a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d 
\n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1602a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1603a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1604a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1605a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1606a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1607a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1608a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1609a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1610a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1611a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1612f6c57405SHong Zhang } 1613a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1614a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1615a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1616f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1617a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat 
struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1618a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1619a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1620ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (solution struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1621a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1622a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1623c0165424SHong Zhang 1624a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1625a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1626a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1627a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1628a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1629a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr); 163042179a6aSHong Zhang 1631a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1632a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d 
\n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1633a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1634f6c57405SHong Zhang 1635a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1636a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1637ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absolute pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1638ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (value of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1639a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1640f6c57405SHong Zhang 1641f6c57405SHong Zhang /* infomation local to each processor */ 164234ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 16431575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(viewer);CHKERRQ(ierr); 1644a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 164534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 164634ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1647a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 164834ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 164934ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1650a5e57a09SHong Zhang ierr = 
PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 165134ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1652f6c57405SHong Zhang 165334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1654a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 165534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1656f6c57405SHong Zhang 165734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1658a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 165934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1660f6c57405SHong Zhang 166134ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1662a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 166334ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1664b34f08ffSHong Zhang 1665b34f08ffSHong Zhang if (mumps->ninfo && mumps->ninfo <= 40){ 1666b34f08ffSHong Zhang PetscInt i; 1667b34f08ffSHong Zhang for (i=0; i<mumps->ninfo; i++){ 1668b34f08ffSHong Zhang ierr = PetscViewerASCIIPrintf(viewer, " INFO(%d): \n",mumps->info[i]);CHKERRQ(ierr); 1669b34f08ffSHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(mumps->info[i]));CHKERRQ(ierr); 1670b34f08ffSHong Zhang ierr = PetscViewerFlush(viewer); 1671b34f08ffSHong Zhang } 1672b34f08ffSHong Zhang } 1673b34f08ffSHong Zhang 1674b34f08ffSHong Zhang 16751575c14dSBarry Smith ierr = PetscViewerASCIIPopSynchronized(viewer);CHKERRQ(ierr); 
1676f6c57405SHong Zhang 1677a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1678a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1679a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1680a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1681a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1682f6c57405SHong Zhang 1683a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1684a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1685a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1686a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1687a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1688a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1689a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total 
real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1690a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1691a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1692a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1693a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1694a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1695a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1696a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1697a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1698a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1699a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d 
\n",mumps->id.INFOG(19));CHKERRQ(ierr); 1700a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1701a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1702a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1703a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1704a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1705a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 170640d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 170740d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 170840d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(30, 31) (after solution: size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 170940d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 171040d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for 
ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 171140d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1712f6c57405SHong Zhang } 1713f6c57405SHong Zhang } 1714cb828f0fSHong Zhang } 1715f6c57405SHong Zhang PetscFunctionReturn(0); 1716f6c57405SHong Zhang } 1717f6c57405SHong Zhang 171835bd34faSBarry Smith #undef __FUNCT__ 171935bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 172035bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 172135bd34faSBarry Smith { 1722*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)A->data; 172335bd34faSBarry Smith 172435bd34faSBarry Smith PetscFunctionBegin; 172535bd34faSBarry Smith info->block_size = 1.0; 1726cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1727cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 172835bd34faSBarry Smith info->nz_unneeded = 0.0; 172935bd34faSBarry Smith info->assemblies = 0.0; 173035bd34faSBarry Smith info->mallocs = 0.0; 173135bd34faSBarry Smith info->memory = 0.0; 173235bd34faSBarry Smith info->fill_ratio_given = 0; 173335bd34faSBarry Smith info->fill_ratio_needed = 0; 173435bd34faSBarry Smith info->factor_mallocs = 0; 173535bd34faSBarry Smith PetscFunctionReturn(0); 173635bd34faSBarry Smith } 173735bd34faSBarry Smith 17385ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 17395ccb76cbSHong Zhang #undef __FUNCT__ 17408e7ba810SStefano Zampini #define __FUNCT__ "MatFactorSetSchurIS_MUMPS" 17418e7ba810SStefano Zampini PetscErrorCode MatFactorSetSchurIS_MUMPS(Mat F, IS is) 17426444a565SStefano Zampini { 1743*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 17448e7ba810SStefano Zampini const PetscInt *idxs; 17458e7ba810SStefano Zampini PetscInt size,i; 17466444a565SStefano Zampini PetscErrorCode ierr; 17476444a565SStefano Zampini 
17486444a565SStefano Zampini PetscFunctionBegin; 174959ac8732SStefano Zampini if (mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MUMPS parallel Schur complements not yet supported from PETSc\n"); 17508e7ba810SStefano Zampini ierr = ISGetLocalSize(is,&size);CHKERRQ(ierr); 17516444a565SStefano Zampini if (mumps->id.size_schur != size) { 17526444a565SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 17536444a565SStefano Zampini mumps->id.size_schur = size; 17546444a565SStefano Zampini mumps->id.schur_lld = size; 17556444a565SStefano Zampini ierr = PetscMalloc2(size,&mumps->id.listvar_schur,size*size,&mumps->id.schur);CHKERRQ(ierr); 17566444a565SStefano Zampini } 17578e7ba810SStefano Zampini ierr = ISGetIndices(is,&idxs);CHKERRQ(ierr); 17586444a565SStefano Zampini ierr = PetscMemcpy(mumps->id.listvar_schur,idxs,size*sizeof(PetscInt));CHKERRQ(ierr); 17598e7ba810SStefano Zampini /* MUMPS expects Fortran style indices */ 17608e7ba810SStefano Zampini for (i=0;i<size;i++) mumps->id.listvar_schur[i]++; 17618e7ba810SStefano Zampini ierr = ISRestoreIndices(is,&idxs);CHKERRQ(ierr); 176278a7176cSStefano Zampini if (size) { /* turn on Schur switch if we the set of indices is not empty */ 17636444a565SStefano Zampini if (F->factortype == MAT_FACTOR_LU) { 176459ac8732SStefano Zampini mumps->id.ICNTL(19) = 3; /* MUMPS returns full matrix */ 17656444a565SStefano Zampini } else { 176659ac8732SStefano Zampini mumps->id.ICNTL(19) = 2; /* MUMPS returns lower triangular part */ 17676444a565SStefano Zampini } 176859ac8732SStefano Zampini /* set a special value of ICNTL (not handled my MUMPS) to be used in the solve phase by PETSc */ 1769b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 177078a7176cSStefano Zampini } 17716444a565SStefano Zampini PetscFunctionReturn(0); 17726444a565SStefano Zampini } 17736444a565SStefano Zampini 17746444a565SStefano Zampini /* 
-------------------------------------------------------------------------------------------*/ 17756444a565SStefano Zampini #undef __FUNCT__ 17765a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorCreateSchurComplement_MUMPS" 17775a05ddb0SStefano Zampini PetscErrorCode MatFactorCreateSchurComplement_MUMPS(Mat F,Mat* S) 17786444a565SStefano Zampini { 17796444a565SStefano Zampini Mat St; 1780*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 17816444a565SStefano Zampini PetscScalar *array; 17826444a565SStefano Zampini #if defined(PETSC_USE_COMPLEX) 17838ac429a0SStefano Zampini PetscScalar im = PetscSqrtScalar((PetscScalar)-1.0); 17846444a565SStefano Zampini #endif 17856444a565SStefano Zampini PetscErrorCode ierr; 17866444a565SStefano Zampini 17876444a565SStefano Zampini PetscFunctionBegin; 17885a05ddb0SStefano Zampini if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatFactorSetSchurIS to enable it"); 17895a05ddb0SStefano Zampini else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! 
You should call MatFactorSetSchurIS before"); 17906f3cc6f9SBarry Smith 17916444a565SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)F),&St);CHKERRQ(ierr); 17926444a565SStefano Zampini ierr = MatSetSizes(St,PETSC_DECIDE,PETSC_DECIDE,mumps->id.size_schur,mumps->id.size_schur);CHKERRQ(ierr); 17936444a565SStefano Zampini ierr = MatSetType(St,MATDENSE);CHKERRQ(ierr); 17946444a565SStefano Zampini ierr = MatSetUp(St);CHKERRQ(ierr); 17956444a565SStefano Zampini ierr = MatDenseGetArray(St,&array);CHKERRQ(ierr); 179659ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full matrix */ 17976444a565SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 17986444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 17996444a565SStefano Zampini for (i=0;i<N;i++) { 18006444a565SStefano Zampini for (j=0;j<N;j++) { 18016444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18026444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18036444a565SStefano Zampini #else 18046444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18056444a565SStefano Zampini #endif 18066444a565SStefano Zampini array[j*N+i] = val; 18076444a565SStefano Zampini } 18086444a565SStefano Zampini } 18096444a565SStefano Zampini } else { /* stored by columns */ 18106444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18116444a565SStefano Zampini } 18126444a565SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 18136444a565SStefano Zampini if (mumps->id.ICNTL(19) == 2) { /* lower triangular stored by columns */ 18146444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18156444a565SStefano Zampini for (i=0;i<N;i++) { 18166444a565SStefano Zampini for (j=i;j<N;j++) { 18176444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18186444a565SStefano Zampini PetscScalar val = 
mumps->id.schur[i*N+j]; 18196444a565SStefano Zampini #else 18206444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18216444a565SStefano Zampini #endif 18226444a565SStefano Zampini array[i*N+j] = val; 18236444a565SStefano Zampini array[j*N+i] = val; 18246444a565SStefano Zampini } 18256444a565SStefano Zampini } 18266444a565SStefano Zampini } else if (mumps->id.ICNTL(19) == 3) { /* full matrix */ 18276444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18286444a565SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 18296444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18306444a565SStefano Zampini for (i=0;i<N;i++) { 18316444a565SStefano Zampini for (j=0;j<i+1;j++) { 18326444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18336444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18346444a565SStefano Zampini #else 18356444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18366444a565SStefano Zampini #endif 18376444a565SStefano Zampini array[i*N+j] = val; 18386444a565SStefano Zampini array[j*N+i] = val; 18396444a565SStefano Zampini } 18406444a565SStefano Zampini } 18416444a565SStefano Zampini } 18426444a565SStefano Zampini } 18436444a565SStefano Zampini ierr = MatDenseRestoreArray(St,&array);CHKERRQ(ierr); 18446444a565SStefano Zampini *S = St; 18456444a565SStefano Zampini PetscFunctionReturn(0); 18466444a565SStefano Zampini } 18476444a565SStefano Zampini 184859ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 184959ac8732SStefano Zampini #undef __FUNCT__ 18505a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorGetSchurComplement_MUMPS" 18515a05ddb0SStefano Zampini PetscErrorCode MatFactorGetSchurComplement_MUMPS(Mat F,Mat* S) 185259ac8732SStefano Zampini { 
185359ac8732SStefano Zampini Mat St; 1854*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 185559ac8732SStefano Zampini PetscErrorCode ierr; 185659ac8732SStefano Zampini 185759ac8732SStefano Zampini PetscFunctionBegin; 18585a05ddb0SStefano Zampini if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatFactorSetSchurIS to enable it"); 18595a05ddb0SStefano Zampini else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatFactorSetSchurIS before"); 18606f3cc6f9SBarry Smith 18617bc32933SStefano Zampini /* It should be the responsibility of the user to handle different ICNTL(19) cases and factorization stages if they want to work with the raw data */ 186259ac8732SStefano Zampini ierr = MatCreateSeqDense(PetscObjectComm((PetscObject)F),mumps->id.size_schur,mumps->id.size_schur,(PetscScalar*)mumps->id.schur,&St);CHKERRQ(ierr); 186359ac8732SStefano Zampini *S = St; 186459ac8732SStefano Zampini PetscFunctionReturn(0); 186559ac8732SStefano Zampini } 186659ac8732SStefano Zampini 186759ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 186859ac8732SStefano Zampini #undef __FUNCT__ 18695a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorInvertSchurComplement_MUMPS" 18705a05ddb0SStefano Zampini PetscErrorCode MatFactorInvertSchurComplement_MUMPS(Mat F) 187159ac8732SStefano Zampini { 1872*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 187359ac8732SStefano Zampini PetscErrorCode ierr; 187459ac8732SStefano Zampini 187559ac8732SStefano Zampini PetscFunctionBegin; 187659ac8732SStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing */ 187759ac8732SStefano Zampini PetscFunctionReturn(0); 187859ac8732SStefano Zampini } 18795a05ddb0SStefano Zampini if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur 
indices not set! You should call MatFactorSetSchurIS before"); 188059ac8732SStefano Zampini ierr = MatMumpsInvertSchur_Private(mumps);CHKERRQ(ierr); 188159ac8732SStefano Zampini PetscFunctionReturn(0); 188259ac8732SStefano Zampini } 188359ac8732SStefano Zampini 18846444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 18856444a565SStefano Zampini #undef __FUNCT__ 18865a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorSolveSchurComplement_MUMPS" 18875a05ddb0SStefano Zampini PetscErrorCode MatFactorSolveSchurComplement_MUMPS(Mat F, Vec rhs, Vec sol) 1888e807eca7SStefano Zampini { 1889*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 1890e807eca7SStefano Zampini MumpsScalar *orhs; 1891e807eca7SStefano Zampini PetscScalar *osol,*nrhs,*nsol; 18929a3a5937SStefano Zampini PetscInt orhs_size,osol_size,olrhs_size; 1893e807eca7SStefano Zampini PetscErrorCode ierr; 1894e807eca7SStefano Zampini 1895e807eca7SStefano Zampini PetscFunctionBegin; 18965a05ddb0SStefano Zampini if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatFactorSetSchurIS to enable it"); 18975a05ddb0SStefano Zampini if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! 
You should call MatFactorSetSchurIS before"); 18986f3cc6f9SBarry Smith 1899e807eca7SStefano Zampini /* swap pointers */ 1900e807eca7SStefano Zampini orhs = mumps->id.redrhs; 19019a3a5937SStefano Zampini olrhs_size = mumps->id.lredrhs; 1902a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 1903e807eca7SStefano Zampini osol = mumps->schur_sol; 1904a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 1905e807eca7SStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 1906e807eca7SStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 1907e807eca7SStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 1908a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 19099a3a5937SStefano Zampini mumps->id.lredrhs = mumps->sizeredrhs; 1910e807eca7SStefano Zampini mumps->schur_sol = nsol; 1911a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 1912a12f35bfSStefano Zampini 1913e807eca7SStefano Zampini /* solve Schur complement */ 1914e807eca7SStefano Zampini mumps->id.nrhs = 1; 1915e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 1916e807eca7SStefano Zampini /* restore pointers */ 1917e807eca7SStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 1918e807eca7SStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 1919e807eca7SStefano Zampini mumps->id.redrhs = orhs; 19209a3a5937SStefano Zampini mumps->id.lredrhs = olrhs_size; 1921a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 1922e807eca7SStefano Zampini mumps->schur_sol = osol; 1923a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 1924e807eca7SStefano Zampini PetscFunctionReturn(0); 1925e807eca7SStefano Zampini } 1926e807eca7SStefano Zampini 19277404bcfbSStefano Zampini /* -------------------------------------------------------------------------------------------*/ 19287404bcfbSStefano Zampini #undef __FUNCT__ 19295a05ddb0SStefano Zampini #define __FUNCT__ 
"MatFactorSolveSchurComplementTranspose_MUMPS" 19305a05ddb0SStefano Zampini PetscErrorCode MatFactorSolveSchurComplementTranspose_MUMPS(Mat F, Vec rhs, Vec sol) 19317404bcfbSStefano Zampini { 1932*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 19337404bcfbSStefano Zampini MumpsScalar *orhs; 19347404bcfbSStefano Zampini PetscScalar *osol,*nrhs,*nsol; 1935a12f35bfSStefano Zampini PetscInt orhs_size,osol_size; 19367404bcfbSStefano Zampini PetscErrorCode ierr; 19377404bcfbSStefano Zampini 19387404bcfbSStefano Zampini PetscFunctionBegin; 19395a05ddb0SStefano Zampini if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatFactorSetSchurIS to enable it"); 19405a05ddb0SStefano Zampini else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatFactorSetSchurIS before"); 19416f3cc6f9SBarry Smith 19427404bcfbSStefano Zampini /* swap pointers */ 19437404bcfbSStefano Zampini orhs = mumps->id.redrhs; 1944a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 19457404bcfbSStefano Zampini osol = mumps->schur_sol; 1946a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 19477404bcfbSStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 19487404bcfbSStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 19497404bcfbSStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 1950a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 19517404bcfbSStefano Zampini mumps->schur_sol = nsol; 1952a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 1953a12f35bfSStefano Zampini 19547404bcfbSStefano Zampini /* solve Schur complement */ 19557404bcfbSStefano Zampini mumps->id.nrhs = 1; 19567404bcfbSStefano Zampini mumps->id.ICNTL(9) = 0; 19577404bcfbSStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 
19587404bcfbSStefano Zampini mumps->id.ICNTL(9) = 1; 19597404bcfbSStefano Zampini /* restore pointers */ 19607404bcfbSStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 19617404bcfbSStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 19627404bcfbSStefano Zampini mumps->id.redrhs = orhs; 1963a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 19647404bcfbSStefano Zampini mumps->schur_sol = osol; 1965a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 19667404bcfbSStefano Zampini PetscFunctionReturn(0); 19677404bcfbSStefano Zampini } 19687404bcfbSStefano Zampini 1969e807eca7SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 1970e807eca7SStefano Zampini #undef __FUNCT__ 19715ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 19725ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 19735ccb76cbSHong Zhang { 1974*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 19755ccb76cbSHong Zhang 19765ccb76cbSHong Zhang PetscFunctionBegin; 1977a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 19785ccb76cbSHong Zhang PetscFunctionReturn(0); 19795ccb76cbSHong Zhang } 19805ccb76cbSHong Zhang 19815ccb76cbSHong Zhang #undef __FUNCT__ 1982bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 1983bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 1984bc6112feSHong Zhang { 1985*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 1986bc6112feSHong Zhang 1987bc6112feSHong Zhang PetscFunctionBegin; 1988bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 1989bc6112feSHong Zhang PetscFunctionReturn(0); 1990bc6112feSHong Zhang } 1991bc6112feSHong Zhang 1992bc6112feSHong Zhang #undef __FUNCT__ 19935ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 19945ccb76cbSHong Zhang /*@ 19955ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 19965ccb76cbSHong Zhang 
19975ccb76cbSHong Zhang Logically Collective on Mat 19985ccb76cbSHong Zhang 19995ccb76cbSHong Zhang Input Parameters: 20005ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 20015ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 20025ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 20035ccb76cbSHong Zhang 20045ccb76cbSHong Zhang Options Database: 20055ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 20065ccb76cbSHong Zhang 20075ccb76cbSHong Zhang Level: beginner 20085ccb76cbSHong Zhang 200996a0c994SBarry Smith References: 201096a0c994SBarry Smith . MUMPS Users' Guide 20115ccb76cbSHong Zhang 20125ccb76cbSHong Zhang .seealso: MatGetFactor() 20135ccb76cbSHong Zhang @*/ 20145ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 20155ccb76cbSHong Zhang { 20165ccb76cbSHong Zhang PetscErrorCode ierr; 20175ccb76cbSHong Zhang 20185ccb76cbSHong Zhang PetscFunctionBegin; 20192989dfd4SHong Zhang PetscValidType(F,1); 20202989dfd4SHong Zhang if (!F->factortype) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONGSTATE,"Only for factored matrix"); 20215ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 20225ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 20235ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 20245ccb76cbSHong Zhang PetscFunctionReturn(0); 20255ccb76cbSHong Zhang } 20265ccb76cbSHong Zhang 2027bc6112feSHong Zhang #undef __FUNCT__ 2028bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 2029a21f80fcSHong Zhang /*@ 2030a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS parameter ICNTL() 2031a21f80fcSHong Zhang 2032a21f80fcSHong Zhang Logically Collective on Mat 2033a21f80fcSHong Zhang 2034a21f80fcSHong Zhang Input Parameters: 2035a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 
2036a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 2037a21f80fcSHong Zhang 2038a21f80fcSHong Zhang Output Parameter: 2039a21f80fcSHong Zhang . ival - value of MUMPS ICNTL(icntl) 2040a21f80fcSHong Zhang 2041a21f80fcSHong Zhang Level: beginner 2042a21f80fcSHong Zhang 204396a0c994SBarry Smith References: 204496a0c994SBarry Smith . MUMPS Users' Guide 2045a21f80fcSHong Zhang 2046a21f80fcSHong Zhang .seealso: MatGetFactor() 2047a21f80fcSHong Zhang @*/ 2048bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 2049bc6112feSHong Zhang { 2050bc6112feSHong Zhang PetscErrorCode ierr; 2051bc6112feSHong Zhang 2052bc6112feSHong Zhang PetscFunctionBegin; 20532989dfd4SHong Zhang PetscValidType(F,1); 20542989dfd4SHong Zhang if (!F->factortype) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONGSTATE,"Only for factored matrix"); 2055bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2056bc6112feSHong Zhang PetscValidIntPointer(ival,3); 20572989dfd4SHong Zhang ierr = PetscUseMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2058bc6112feSHong Zhang PetscFunctionReturn(0); 2059bc6112feSHong Zhang } 2060bc6112feSHong Zhang 20618928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 20628928b65cSHong Zhang #undef __FUNCT__ 20638928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 20648928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 20658928b65cSHong Zhang { 2066*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 20678928b65cSHong Zhang 20688928b65cSHong Zhang PetscFunctionBegin; 20698928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 20708928b65cSHong Zhang PetscFunctionReturn(0); 20718928b65cSHong Zhang } 20728928b65cSHong Zhang 20738928b65cSHong Zhang #undef __FUNCT__ 2074bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl_MUMPS" 2075bc6112feSHong Zhang 
PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 2076bc6112feSHong Zhang { 2077*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 2078bc6112feSHong Zhang 2079bc6112feSHong Zhang PetscFunctionBegin; 2080bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 2081bc6112feSHong Zhang PetscFunctionReturn(0); 2082bc6112feSHong Zhang } 2083bc6112feSHong Zhang 2084bc6112feSHong Zhang #undef __FUNCT__ 20858928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 20868928b65cSHong Zhang /*@ 20878928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 20888928b65cSHong Zhang 20898928b65cSHong Zhang Logically Collective on Mat 20908928b65cSHong Zhang 20918928b65cSHong Zhang Input Parameters: 20928928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 20938928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 20948928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 20958928b65cSHong Zhang 20968928b65cSHong Zhang Options Database: 20978928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 20988928b65cSHong Zhang 20998928b65cSHong Zhang Level: beginner 21008928b65cSHong Zhang 210196a0c994SBarry Smith References: 210296a0c994SBarry Smith . 
MUMPS Users' Guide 21038928b65cSHong Zhang 21048928b65cSHong Zhang .seealso: MatGetFactor() 21058928b65cSHong Zhang @*/ 21068928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 21078928b65cSHong Zhang { 21088928b65cSHong Zhang PetscErrorCode ierr; 21098928b65cSHong Zhang 21108928b65cSHong Zhang PetscFunctionBegin; 21112989dfd4SHong Zhang PetscValidType(F,1); 21122989dfd4SHong Zhang if (!F->factortype) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONGSTATE,"Only for factored matrix"); 21138928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2114bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 21158928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 21168928b65cSHong Zhang PetscFunctionReturn(0); 21178928b65cSHong Zhang } 21188928b65cSHong Zhang 2119bc6112feSHong Zhang #undef __FUNCT__ 2120bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 2121a21f80fcSHong Zhang /*@ 2122a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 2123a21f80fcSHong Zhang 2124a21f80fcSHong Zhang Logically Collective on Mat 2125a21f80fcSHong Zhang 2126a21f80fcSHong Zhang Input Parameters: 2127a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2128a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 2129a21f80fcSHong Zhang 2130a21f80fcSHong Zhang Output Parameter: 2131a21f80fcSHong Zhang . val - value of MUMPS CNTL(icntl) 2132a21f80fcSHong Zhang 2133a21f80fcSHong Zhang Level: beginner 2134a21f80fcSHong Zhang 213596a0c994SBarry Smith References: 213696a0c994SBarry Smith . 
MUMPS Users' Guide 2137a21f80fcSHong Zhang 2138a21f80fcSHong Zhang .seealso: MatGetFactor() 2139a21f80fcSHong Zhang @*/ 2140bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 2141bc6112feSHong Zhang { 2142bc6112feSHong Zhang PetscErrorCode ierr; 2143bc6112feSHong Zhang 2144bc6112feSHong Zhang PetscFunctionBegin; 21452989dfd4SHong Zhang PetscValidType(F,1); 21462989dfd4SHong Zhang if (!F->factortype) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONGSTATE,"Only for factored matrix"); 2147bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2148bc6112feSHong Zhang PetscValidRealPointer(val,3); 21492989dfd4SHong Zhang ierr = PetscUseMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2150bc6112feSHong Zhang PetscFunctionReturn(0); 2151bc6112feSHong Zhang } 2152bc6112feSHong Zhang 2153bc6112feSHong Zhang #undef __FUNCT__ 2154ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 2155ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 2156bc6112feSHong Zhang { 2157*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 2158bc6112feSHong Zhang 2159bc6112feSHong Zhang PetscFunctionBegin; 2160bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 2161bc6112feSHong Zhang PetscFunctionReturn(0); 2162bc6112feSHong Zhang } 2163bc6112feSHong Zhang 2164bc6112feSHong Zhang #undef __FUNCT__ 2165ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 2166ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 2167bc6112feSHong Zhang { 2168*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 2169bc6112feSHong Zhang 2170bc6112feSHong Zhang PetscFunctionBegin; 2171bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 2172bc6112feSHong Zhang PetscFunctionReturn(0); 2173bc6112feSHong Zhang } 2174bc6112feSHong Zhang 2175bc6112feSHong Zhang #undef __FUNCT__ 2176ca810319SHong Zhang #define __FUNCT__ 
"MatMumpsGetRinfo_MUMPS" 2177ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 2178bc6112feSHong Zhang { 2179*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 2180bc6112feSHong Zhang 2181bc6112feSHong Zhang PetscFunctionBegin; 2182bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 2183bc6112feSHong Zhang PetscFunctionReturn(0); 2184bc6112feSHong Zhang } 2185bc6112feSHong Zhang 2186bc6112feSHong Zhang #undef __FUNCT__ 2187ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 2188ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 2189bc6112feSHong Zhang { 2190*e69c285eSBarry Smith Mat_MUMPS *mumps =(Mat_MUMPS*)F->data; 2191bc6112feSHong Zhang 2192bc6112feSHong Zhang PetscFunctionBegin; 2193bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 2194bc6112feSHong Zhang PetscFunctionReturn(0); 2195bc6112feSHong Zhang } 2196bc6112feSHong Zhang 2197bc6112feSHong Zhang #undef __FUNCT__ 2198ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 2199a21f80fcSHong Zhang /*@ 2200a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 2201a21f80fcSHong Zhang 2202a21f80fcSHong Zhang Logically Collective on Mat 2203a21f80fcSHong Zhang 2204a21f80fcSHong Zhang Input Parameters: 2205a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2206a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 2207a21f80fcSHong Zhang 2208a21f80fcSHong Zhang Output Parameter: 2209a21f80fcSHong Zhang . ival - value of MUMPS INFO(icntl) 2210a21f80fcSHong Zhang 2211a21f80fcSHong Zhang Level: beginner 2212a21f80fcSHong Zhang 221396a0c994SBarry Smith References: 221496a0c994SBarry Smith . 
MUMPS Users' Guide 2215a21f80fcSHong Zhang 2216a21f80fcSHong Zhang .seealso: MatGetFactor() 2217a21f80fcSHong Zhang @*/ 2218ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 2219bc6112feSHong Zhang { 2220bc6112feSHong Zhang PetscErrorCode ierr; 2221bc6112feSHong Zhang 2222bc6112feSHong Zhang PetscFunctionBegin; 22232989dfd4SHong Zhang PetscValidType(F,1); 22242989dfd4SHong Zhang if (!F->factortype) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONGSTATE,"Only for factored matrix"); 2225ca810319SHong Zhang PetscValidIntPointer(ival,3); 22262989dfd4SHong Zhang ierr = PetscUseMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2227bc6112feSHong Zhang PetscFunctionReturn(0); 2228bc6112feSHong Zhang } 2229bc6112feSHong Zhang 2230bc6112feSHong Zhang #undef __FUNCT__ 2231ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 2232a21f80fcSHong Zhang /*@ 2233a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 2234a21f80fcSHong Zhang 2235a21f80fcSHong Zhang Logically Collective on Mat 2236a21f80fcSHong Zhang 2237a21f80fcSHong Zhang Input Parameters: 2238a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2239a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 2240a21f80fcSHong Zhang 2241a21f80fcSHong Zhang Output Parameter: 2242a21f80fcSHong Zhang . ival - value of MUMPS INFOG(icntl) 2243a21f80fcSHong Zhang 2244a21f80fcSHong Zhang Level: beginner 2245a21f80fcSHong Zhang 224696a0c994SBarry Smith References: 224796a0c994SBarry Smith . 
MUMPS Users' Guide 2248a21f80fcSHong Zhang 2249a21f80fcSHong Zhang .seealso: MatGetFactor() 2250a21f80fcSHong Zhang @*/ 2251ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 2252bc6112feSHong Zhang { 2253bc6112feSHong Zhang PetscErrorCode ierr; 2254bc6112feSHong Zhang 2255bc6112feSHong Zhang PetscFunctionBegin; 22562989dfd4SHong Zhang PetscValidType(F,1); 22572989dfd4SHong Zhang if (!F->factortype) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONGSTATE,"Only for factored matrix"); 2258ca810319SHong Zhang PetscValidIntPointer(ival,3); 22592989dfd4SHong Zhang ierr = PetscUseMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2260bc6112feSHong Zhang PetscFunctionReturn(0); 2261bc6112feSHong Zhang } 2262bc6112feSHong Zhang 2263bc6112feSHong Zhang #undef __FUNCT__ 2264ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 2265a21f80fcSHong Zhang /*@ 2266a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 2267a21f80fcSHong Zhang 2268a21f80fcSHong Zhang Logically Collective on Mat 2269a21f80fcSHong Zhang 2270a21f80fcSHong Zhang Input Parameters: 2271a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2272a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 2273a21f80fcSHong Zhang 2274a21f80fcSHong Zhang Output Parameter: 2275a21f80fcSHong Zhang . val - value of MUMPS RINFO(icntl) 2276a21f80fcSHong Zhang 2277a21f80fcSHong Zhang Level: beginner 2278a21f80fcSHong Zhang 227996a0c994SBarry Smith References: 228096a0c994SBarry Smith . 
MUMPS Users' Guide 2281a21f80fcSHong Zhang 2282a21f80fcSHong Zhang .seealso: MatGetFactor() 2283a21f80fcSHong Zhang @*/ 2284ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 2285bc6112feSHong Zhang { 2286bc6112feSHong Zhang PetscErrorCode ierr; 2287bc6112feSHong Zhang 2288bc6112feSHong Zhang PetscFunctionBegin; 22892989dfd4SHong Zhang PetscValidType(F,1); 22902989dfd4SHong Zhang if (!F->factortype) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONGSTATE,"Only for factored matrix"); 2291bc6112feSHong Zhang PetscValidRealPointer(val,3); 22922989dfd4SHong Zhang ierr = PetscUseMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2293bc6112feSHong Zhang PetscFunctionReturn(0); 2294bc6112feSHong Zhang } 2295bc6112feSHong Zhang 2296bc6112feSHong Zhang #undef __FUNCT__ 2297ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 2298a21f80fcSHong Zhang /*@ 2299a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 2300a21f80fcSHong Zhang 2301a21f80fcSHong Zhang Logically Collective on Mat 2302a21f80fcSHong Zhang 2303a21f80fcSHong Zhang Input Parameters: 2304a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2305a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 2306a21f80fcSHong Zhang 2307a21f80fcSHong Zhang Output Parameter: 2308a21f80fcSHong Zhang . val - value of MUMPS RINFOG(icntl) 2309a21f80fcSHong Zhang 2310a21f80fcSHong Zhang Level: beginner 2311a21f80fcSHong Zhang 231296a0c994SBarry Smith References: 231396a0c994SBarry Smith . 
MUMPS Users' Guide 2314a21f80fcSHong Zhang 2315a21f80fcSHong Zhang .seealso: MatGetFactor() 2316a21f80fcSHong Zhang @*/ 2317ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 2318bc6112feSHong Zhang { 2319bc6112feSHong Zhang PetscErrorCode ierr; 2320bc6112feSHong Zhang 2321bc6112feSHong Zhang PetscFunctionBegin; 23222989dfd4SHong Zhang PetscValidType(F,1); 23232989dfd4SHong Zhang if (!F->factortype) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONGSTATE,"Only for factored matrix"); 2324bc6112feSHong Zhang PetscValidRealPointer(val,3); 23252989dfd4SHong Zhang ierr = PetscUseMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2326bc6112feSHong Zhang PetscFunctionReturn(0); 2327bc6112feSHong Zhang } 2328bc6112feSHong Zhang 232924b6179bSKris Buschelman /*MC 23302692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 233124b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 233224b6179bSKris Buschelman 233341c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 233424b6179bSKris Buschelman 2335c2b89b5dSBarry Smith Use ./configure --download-mumps --download-scalapack --download-parmetis --download-metis --download-ptscotch to have PETSc installed with MUMPS 2336c2b89b5dSBarry Smith 2337c2b89b5dSBarry Smith Use -pc_type cholesky or lu -pc_factor_mat_solver_package mumps to us this direct solver 2338c2b89b5dSBarry Smith 233924b6179bSKris Buschelman Options Database Keys: 23404422a9fcSPatrick Sanan + -mat_mumps_icntl_1 - ICNTL(1): output stream for error messages 23414422a9fcSPatrick Sanan . -mat_mumps_icntl_2 - ICNTL(2): output stream for diagnostic printing, statistics, and warning 23424422a9fcSPatrick Sanan . -mat_mumps_icntl_3 - ICNTL(3): output stream for global information, collected on the host 23434422a9fcSPatrick Sanan . 
-mat_mumps_icntl_4 - ICNTL(4): level of printing (0 to 4) 23444422a9fcSPatrick Sanan . -mat_mumps_icntl_6 - ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) 23454422a9fcSPatrick Sanan . -mat_mumps_icntl_7 - ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis 23464422a9fcSPatrick Sanan . -mat_mumps_icntl_8 - ICNTL(8): scaling strategy (-2 to 8 or 77) 23474422a9fcSPatrick Sanan . -mat_mumps_icntl_10 - ICNTL(10): max num of refinements 23484422a9fcSPatrick Sanan . -mat_mumps_icntl_11 - ICNTL(11): statistics related to an error analysis (via -ksp_view) 23494422a9fcSPatrick Sanan . -mat_mumps_icntl_12 - ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) 23504422a9fcSPatrick Sanan . -mat_mumps_icntl_13 - ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting 23514422a9fcSPatrick Sanan . -mat_mumps_icntl_14 - ICNTL(14): percentage increase in the estimated working space 23524422a9fcSPatrick Sanan . -mat_mumps_icntl_19 - ICNTL(19): computes the Schur complement 23534422a9fcSPatrick Sanan . -mat_mumps_icntl_22 - ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) 23544422a9fcSPatrick Sanan . -mat_mumps_icntl_23 - ICNTL(23): max size of the working memory (MB) that can be allocated per processor 23554422a9fcSPatrick Sanan . -mat_mumps_icntl_24 - ICNTL(24): detection of null pivot rows (0 or 1) 23564422a9fcSPatrick Sanan . -mat_mumps_icntl_25 - ICNTL(25): compute a solution of a deficient matrix and a null space basis 23574422a9fcSPatrick Sanan . -mat_mumps_icntl_26 - ICNTL(26): drives the solution phase if a Schur complement matrix 23584422a9fcSPatrick Sanan . -mat_mumps_icntl_28 - ICNTL(28): use 1 for sequential analysis and icntl(7) ordering, or 2 for parallel analysis and icntl(29) ordering 23594422a9fcSPatrick Sanan . -mat_mumps_icntl_29 - ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis 23604422a9fcSPatrick Sanan . 
-mat_mumps_icntl_30 - ICNTL(30): compute user-specified set of entries in inv(A) 23614422a9fcSPatrick Sanan . -mat_mumps_icntl_31 - ICNTL(31): indicates which factors may be discarded during factorization 23624422a9fcSPatrick Sanan . -mat_mumps_icntl_33 - ICNTL(33): compute determinant 23634422a9fcSPatrick Sanan . -mat_mumps_cntl_1 - CNTL(1): relative pivoting threshold 23644422a9fcSPatrick Sanan . -mat_mumps_cntl_2 - CNTL(2): stopping criterion of refinement 23654422a9fcSPatrick Sanan . -mat_mumps_cntl_3 - CNTL(3): absolute pivoting threshold 23664422a9fcSPatrick Sanan . -mat_mumps_cntl_4 - CNTL(4): value for static pivoting 23674422a9fcSPatrick Sanan - -mat_mumps_cntl_5 - CNTL(5): fixation for null pivots 236824b6179bSKris Buschelman 236924b6179bSKris Buschelman Level: beginner 237024b6179bSKris Buschelman 237141c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 237241c8de11SBarry Smith 237324b6179bSKris Buschelman M*/ 237424b6179bSKris Buschelman 237535bd34faSBarry Smith #undef __FUNCT__ 237635bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 2377f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 237835bd34faSBarry Smith { 237935bd34faSBarry Smith PetscFunctionBegin; 23802692d6eeSBarry Smith *type = MATSOLVERMUMPS; 238135bd34faSBarry Smith PetscFunctionReturn(0); 238235bd34faSBarry Smith } 238335bd34faSBarry Smith 2384bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 23852877fffaSHong Zhang #undef __FUNCT__ 2386bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 2387cc2e6a90SBarry Smith static PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 23882877fffaSHong Zhang { 23892877fffaSHong Zhang Mat B; 23902877fffaSHong Zhang PetscErrorCode ierr; 23912877fffaSHong Zhang Mat_MUMPS *mumps; 2392ace3abfcSBarry Smith PetscBool isSeqAIJ; 23932877fffaSHong Zhang 23942877fffaSHong Zhang PetscFunctionBegin; 
23952877fffaSHong Zhang /* Create the factorization matrix */ 2396251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 2397ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 23982877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 2399*e69c285eSBarry Smith ierr = PetscStrallocpy("mumps",&((PetscObject)B)->type_name);CHKERRQ(ierr); 2400*e69c285eSBarry Smith ierr = MatSetUp(B);CHKERRQ(ierr); 24012877fffaSHong Zhang 2402b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 24032205254eSKarl Rupp 24042877fffaSHong Zhang B->ops->view = MatView_MUMPS; 240535bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 24062205254eSKarl Rupp 2407bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 24085a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSetSchurIS_C",MatFactorSetSchurIS_MUMPS);CHKERRQ(ierr); 24095a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorInvertSchurComplement_C",MatFactorInvertSchurComplement_MUMPS);CHKERRQ(ierr); 24105a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorCreateSchurComplement_C",MatFactorCreateSchurComplement_MUMPS);CHKERRQ(ierr); 24115a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSchurComplement_C",MatFactorGetSchurComplement_MUMPS);CHKERRQ(ierr); 24125a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplement_C",MatFactorSolveSchurComplement_MUMPS);CHKERRQ(ierr); 24135a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplementTranspose_C",MatFactorSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2414bdf89e91SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2415bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2416bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2417bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2418ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2419ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2420ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2421ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 24226444a565SStefano Zampini 2423450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2424450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 2425d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 2426bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 2427bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 2428746480a1SHong Zhang mumps->sym = 0; 2429dcd589f8SShri Abhyankar } else { 243067877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2431450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 2432bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 2433bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 243459ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 243559ac8732SStefano Zampini mumps->sym = 2; 
243659ac8732SStefano Zampini #else 24376fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 24386fdc2a6dSBarry Smith else mumps->sym = 2; 243959ac8732SStefano Zampini #endif 2440450b117fSShri Abhyankar } 24412877fffaSHong Zhang 244200c67f3bSHong Zhang /* set solvertype */ 244300c67f3bSHong Zhang ierr = PetscFree(B->solvertype);CHKERRQ(ierr); 244400c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERMUMPS,&B->solvertype);CHKERRQ(ierr); 244500c67f3bSHong Zhang 24462877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 24472877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 2448*e69c285eSBarry Smith B->data = (void*)mumps; 24492205254eSKarl Rupp 2450f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2451746480a1SHong Zhang 24522877fffaSHong Zhang *F = B; 24532877fffaSHong Zhang PetscFunctionReturn(0); 24542877fffaSHong Zhang } 24552877fffaSHong Zhang 2456bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 24572877fffaSHong Zhang #undef __FUNCT__ 2458bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 2459cc2e6a90SBarry Smith static PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 24602877fffaSHong Zhang { 24612877fffaSHong Zhang Mat B; 24622877fffaSHong Zhang PetscErrorCode ierr; 24632877fffaSHong Zhang Mat_MUMPS *mumps; 2464ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 24652877fffaSHong Zhang 24662877fffaSHong Zhang PetscFunctionBegin; 2467ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 2468ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 2469251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 24702877fffaSHong Zhang /* Create the factorization matrix */ 
2471ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 24722877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 2473*e69c285eSBarry Smith ierr = PetscStrallocpy("mumps",&((PetscObject)B)->type_name);CHKERRQ(ierr); 2474*e69c285eSBarry Smith ierr = MatSetUp(B);CHKERRQ(ierr); 2475*e69c285eSBarry Smith 2476b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2477bccb9932SShri Abhyankar if (isSeqSBAIJ) { 247816ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 2479dcd589f8SShri Abhyankar } else { 2480bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 2481bccb9932SShri Abhyankar } 2482bccb9932SShri Abhyankar 2483*e69c285eSBarry Smith B->ops->getinfo = MatGetInfo_External; 248467877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2485bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 24862205254eSKarl Rupp 2487bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 24885a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSetSchurIS_C",MatFactorSetSchurIS_MUMPS);CHKERRQ(ierr); 24895a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorInvertSchurComplement_C",MatFactorInvertSchurComplement_MUMPS);CHKERRQ(ierr); 24905a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorCreateSchurComplement_C",MatFactorCreateSchurComplement_MUMPS);CHKERRQ(ierr); 24915a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSchurComplement_C",MatFactorGetSchurComplement_MUMPS);CHKERRQ(ierr); 24925a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplement_C",MatFactorSolveSchurComplement_MUMPS);CHKERRQ(ierr); 24935a05ddb0SStefano 
Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplementTranspose_C",MatFactorSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2494b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2495b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2496b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2497b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2498ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2499ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2500ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2501ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 25022205254eSKarl Rupp 2503f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 250459ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 250559ac8732SStefano Zampini mumps->sym = 2; 250659ac8732SStefano Zampini #else 25076fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 25086fdc2a6dSBarry Smith else mumps->sym = 2; 250959ac8732SStefano Zampini #endif 2510a214ac2aSShri Abhyankar 251100c67f3bSHong Zhang /* set solvertype */ 251200c67f3bSHong Zhang ierr = PetscFree(B->solvertype);CHKERRQ(ierr); 251300c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERMUMPS,&B->solvertype);CHKERRQ(ierr); 251400c67f3bSHong Zhang 2515bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 2516f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 2517*e69c285eSBarry Smith 
B->data = (void*)mumps; 25182205254eSKarl Rupp 2519f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2520746480a1SHong Zhang 25212877fffaSHong Zhang *F = B; 25222877fffaSHong Zhang PetscFunctionReturn(0); 25232877fffaSHong Zhang } 252497969023SHong Zhang 2525450b117fSShri Abhyankar #undef __FUNCT__ 2526bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 2527cc2e6a90SBarry Smith static PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 252867877ebaSShri Abhyankar { 252967877ebaSShri Abhyankar Mat B; 253067877ebaSShri Abhyankar PetscErrorCode ierr; 253167877ebaSShri Abhyankar Mat_MUMPS *mumps; 2532ace3abfcSBarry Smith PetscBool isSeqBAIJ; 253367877ebaSShri Abhyankar 253467877ebaSShri Abhyankar PetscFunctionBegin; 253567877ebaSShri Abhyankar /* Create the factorization matrix */ 2536251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 2537ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 253867877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 2539*e69c285eSBarry Smith ierr = PetscStrallocpy("mumps",&((PetscObject)B)->type_name);CHKERRQ(ierr); 2540*e69c285eSBarry Smith ierr = MatSetUp(B);CHKERRQ(ierr); 2541450b117fSShri Abhyankar 2542b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2543450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2544450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 2545450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 2546bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 2547bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 2548746480a1SHong Zhang mumps->sym = 0; 2549f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ 
matrix instead\n"); 2550bccb9932SShri Abhyankar 2551*e69c285eSBarry Smith B->ops->getinfo = MatGetInfo_External; 2552450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 25532205254eSKarl Rupp 2554bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 25555a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSetSchurIS_C",MatFactorSetSchurIS_MUMPS);CHKERRQ(ierr); 25565a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorInvertSchurComplement_C",MatFactorInvertSchurComplement_MUMPS);CHKERRQ(ierr); 25575a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorCreateSchurComplement_C",MatFactorCreateSchurComplement_MUMPS);CHKERRQ(ierr); 25585a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSchurComplement_C",MatFactorGetSchurComplement_MUMPS);CHKERRQ(ierr); 25595a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplement_C",MatFactorSolveSchurComplement_MUMPS);CHKERRQ(ierr); 25605a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplementTranspose_C",MatFactorSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2561bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2562bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2563bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2564bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2565ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 
2566ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2567ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2568ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2569450b117fSShri Abhyankar 257000c67f3bSHong Zhang /* set solvertype */ 257100c67f3bSHong Zhang ierr = PetscFree(B->solvertype);CHKERRQ(ierr); 257200c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERMUMPS,&B->solvertype);CHKERRQ(ierr); 257300c67f3bSHong Zhang 2574450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2575450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2576*e69c285eSBarry Smith B->data = (void*)mumps; 25772205254eSKarl Rupp 2578f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2579746480a1SHong Zhang 2580450b117fSShri Abhyankar *F = B; 2581450b117fSShri Abhyankar PetscFunctionReturn(0); 2582450b117fSShri Abhyankar } 258342c9c57cSBarry Smith 258442c9c57cSBarry Smith #undef __FUNCT__ 258542c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 258629b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 258742c9c57cSBarry Smith { 258842c9c57cSBarry Smith PetscErrorCode ierr; 258942c9c57cSBarry Smith 259042c9c57cSBarry Smith PetscFunctionBegin; 259142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 259242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 259342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 259442c9c57cSBarry Smith ierr = 
MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 259542c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 259642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 259742c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 259842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 259942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 260042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 260142c9c57cSBarry Smith PetscFunctionReturn(0); 260242c9c57cSBarry Smith } 260342c9c57cSBarry Smith 2604