11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8b5fa320bSStefano Zampini #include <petscblaslapack.h> 9397b6df1SKris Buschelman 10397b6df1SKris Buschelman EXTERN_C_BEGIN 11397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 122907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 132907cef9SHong Zhang #include <cmumps_c.h> 142907cef9SHong Zhang #else 15c6db04a5SJed Brown #include <zmumps_c.h> 162907cef9SHong Zhang #endif 172907cef9SHong Zhang #else 182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 192907cef9SHong Zhang #include <smumps_c.h> 20397b6df1SKris Buschelman #else 21c6db04a5SJed Brown #include <dmumps_c.h> 22397b6df1SKris Buschelman #endif 232907cef9SHong Zhang #endif 24397b6df1SKris Buschelman EXTERN_C_END 25397b6df1SKris Buschelman #define JOB_INIT -1 263d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 273d472b54SHong Zhang #define JOB_FACTNUMERIC 2 283d472b54SHong Zhang #define JOB_SOLVE 3 29397b6df1SKris Buschelman #define JOB_END -2 303d472b54SHong Zhang 312907cef9SHong Zhang /* calls to MUMPS */ 322907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 332907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 342907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 352907cef9SHong Zhang #else 362907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 372907cef9SHong Zhang #endif 382907cef9SHong Zhang #else 392907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 402907cef9SHong Zhang #define PetscMUMPS_c smumps_c 412907cef9SHong Zhang #else 422907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 432907cef9SHong Zhang #endif 442907cef9SHong Zhang #endif 452907cef9SHong Zhang 46940cd9d6SSatish Balay /* declare MumpsScalar */ 47940cd9d6SSatish Balay #if defined(PETSC_USE_COMPLEX) 48940cd9d6SSatish Balay #if defined(PETSC_USE_REAL_SINGLE) 49940cd9d6SSatish Balay #define MumpsScalar mumps_complex 50940cd9d6SSatish Balay #else 51940cd9d6SSatish Balay #define MumpsScalar mumps_double_complex 52940cd9d6SSatish Balay #endif 53940cd9d6SSatish Balay #else 54940cd9d6SSatish Balay #define MumpsScalar PetscScalar 55940cd9d6SSatish Balay #endif 563d472b54SHong Zhang 57397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 58397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 59397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 60397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 61a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 62397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 63adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 64397b6df1SKris Buschelman 65397b6df1SKris Buschelman typedef struct { 66397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 672907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 682907cef9SHong Zhang CMUMPS_STRUC_C id; 692907cef9SHong Zhang #else 70397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 712907cef9SHong Zhang #endif 722907cef9SHong Zhang #else 732907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 742907cef9SHong Zhang SMUMPS_STRUC_C id; 75397b6df1SKris Buschelman #else 76397b6df1SKris Buschelman DMUMPS_STRUC_C id; 77397b6df1SKris Buschelman #endif 782907cef9SHong Zhang #endif 792907cef9SHong Zhang 80397b6df1SKris Buschelman MatStructure matstruc; 81c1490034SHong Zhang PetscMPIInt myid,size; 82a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 83397b6df1SKris Buschelman PetscScalar *val; 84397b6df1SKris Buschelman MPI_Comm comm_mumps; 8564e6c443SBarry Smith PetscBool isAIJ,CleanUpMUMPS; 86a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 87801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 88801fbe65SHong Zhang Vec b_seq,x_seq; 89b34f08ffSHong Zhang PetscInt ninfo,*info; /* display INFO */ 90b5fa320bSStefano Zampini PetscBool schur_second_solve; 91b5fa320bSStefano Zampini PetscInt sizeredrhs; 92b5fa320bSStefano Zampini PetscInt *schur_pivots; 9359ac8732SStefano Zampini PetscInt schur_B_lwork; 94b5fa320bSStefano Zampini PetscScalar *schur_work; 9559ac8732SStefano Zampini PetscScalar *schur_sol; 9659ac8732SStefano Zampini PetscInt schur_sizesol; 9759ac8732SStefano Zampini PetscBool schur_restored; 9859ac8732SStefano Zampini PetscBool schur_factored; 9959ac8732SStefano Zampini PetscBool schur_inverted; 1002205254eSKarl Rupp 101bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 102bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 103f0c56d0fSKris Buschelman } Mat_MUMPS; 104f0c56d0fSKris Buschelman 10509573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 106b24902e0SBarry Smith 10759ac8732SStefano Zampini #undef __FUNCT__ 10859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsResetSchur_Private" 10959ac8732SStefano Zampini static PetscErrorCode MatMumpsResetSchur_Private(Mat_MUMPS* mumps) 110b5fa320bSStefano Zampini { 111b5fa320bSStefano Zampini PetscErrorCode ierr; 112b5fa320bSStefano Zampini 113b5fa320bSStefano Zampini PetscFunctionBegin; 11459ac8732SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 11559ac8732SStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 11659ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 11759ac8732SStefano Zampini ierr = PetscFree(mumps->schur_pivots);CHKERRQ(ierr); 11859ac8732SStefano Zampini ierr = PetscFree(mumps->schur_work);CHKERRQ(ierr); 11959ac8732SStefano Zampini if (!mumps->schur_restored) { 12059ac8732SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 12159ac8732SStefano Zampini } 12259ac8732SStefano Zampini mumps->id.size_schur = 0; 12359ac8732SStefano Zampini mumps->id.ICNTL(19) = 0; 12459ac8732SStefano Zampini PetscFunctionReturn(0); 12559ac8732SStefano Zampini } 12659ac8732SStefano Zampini 12759ac8732SStefano Zampini #undef __FUNCT__ 12859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsFactorSchur_Private" 12959ac8732SStefano Zampini static PetscErrorCode MatMumpsFactorSchur_Private(Mat_MUMPS* mumps) 13059ac8732SStefano Zampini { 13159ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 13259ac8732SStefano Zampini PetscErrorCode ierr; 13359ac8732SStefano Zampini 13459ac8732SStefano Zampini PetscFunctionBegin; 13559ac8732SStefano Zampini if (mumps->schur_factored) { 13659ac8732SStefano Zampini PetscFunctionReturn(0); 13759ac8732SStefano Zampini } 13859ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 13959ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 14059ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 14159ac8732SStefano Zampini if (!mumps->schur_pivots) { 14259ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 14359ac8732SStefano Zampini } 14459ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 14559ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&B_N,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&B_ierr)); 14659ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 14759ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRF Lapack routine %d",(int)B_ierr); 14859ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 14959ac8732SStefano Zampini char ord[2]; 15059ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 15159ac8732SStefano Zampini sprintf(ord,"L"); 15259ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 15359ac8732SStefano Zampini sprintf(ord,"U"); 15459ac8732SStefano Zampini } 15559ac8732SStefano Zampini if (mumps->id.sym == 2) { 15659ac8732SStefano Zampini if (!mumps->schur_pivots) { 15759ac8732SStefano Zampini PetscScalar lwork; 15859ac8732SStefano Zampini 15959ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 16059ac8732SStefano Zampini mumps->schur_B_lwork=-1; 16159ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 16359ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 16459ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYTRF Lapack routine %d",(int)B_ierr); 16559ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 16659ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 16759ac8732SStefano Zampini } 16859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 17059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRF Lapack routine %d",(int)B_ierr); 17259ac8732SStefano Zampini } else { 17359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 17459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,&B_ierr)); 17559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRF Lapack routine %d",(int)B_ierr); 17759ac8732SStefano Zampini } 17859ac8732SStefano Zampini } 17959ac8732SStefano Zampini mumps->schur_factored = PETSC_TRUE; 18059ac8732SStefano Zampini PetscFunctionReturn(0); 18159ac8732SStefano Zampini } 18259ac8732SStefano Zampini 18359ac8732SStefano Zampini #undef __FUNCT__ 18459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchur_Private" 18559ac8732SStefano Zampini static PetscErrorCode MatMumpsInvertSchur_Private(Mat_MUMPS* mumps) 18659ac8732SStefano Zampini { 18759ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 18859ac8732SStefano Zampini PetscErrorCode ierr; 18959ac8732SStefano Zampini 19059ac8732SStefano Zampini PetscFunctionBegin; 19159ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 19259ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 19359ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 19459ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 19559ac8732SStefano Zampini if (!mumps->schur_work) { 19659ac8732SStefano Zampini PetscScalar lwork; 19759ac8732SStefano Zampini 19859ac8732SStefano Zampini mumps->schur_B_lwork = -1; 19959ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 20159ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20259ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GETRI Lapack routine %d",(int)B_ierr); 20359ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 20459ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 20559ac8732SStefano Zampini } 20659ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20759ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 20859ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20959ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRI Lapack routine %d",(int)B_ierr); 21059ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 21159ac8732SStefano Zampini char ord[2]; 21259ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 21359ac8732SStefano Zampini sprintf(ord,"L"); 21459ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 21559ac8732SStefano Zampini sprintf(ord,"U"); 21659ac8732SStefano Zampini } 21759ac8732SStefano Zampini if (mumps->id.sym == 2) { 21859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&B_ierr)); 22059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRI Lapack routine %d",(int)B_ierr); 22259ac8732SStefano Zampini } else { 22359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,&B_ierr)); 22559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRI Lapack routine %d",(int)B_ierr); 22759ac8732SStefano Zampini } 22859ac8732SStefano Zampini } 22959ac8732SStefano Zampini mumps->schur_inverted = PETSC_TRUE; 23059ac8732SStefano Zampini PetscFunctionReturn(0); 23159ac8732SStefano Zampini } 23259ac8732SStefano Zampini 23359ac8732SStefano Zampini #undef __FUNCT__ 23459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchur_Private" 235e807eca7SStefano Zampini static PetscErrorCode MatMumpsSolveSchur_Private(Mat_MUMPS* mumps, PetscBool sol_in_redrhs) 23659ac8732SStefano Zampini { 23759ac8732SStefano Zampini PetscBLASInt B_N,B_Nrhs,B_ierr,B_slda,B_rlda; 23859ac8732SStefano Zampini PetscScalar one=1.,zero=0.; 23959ac8732SStefano Zampini PetscErrorCode ierr; 24059ac8732SStefano Zampini 24159ac8732SStefano Zampini PetscFunctionBegin; 24259ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 243b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 244b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 245b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.nrhs,&B_Nrhs);CHKERRQ(ierr); 246b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.lredrhs,&B_rlda);CHKERRQ(ierr); 24759ac8732SStefano Zampini if (mumps->schur_inverted) { 24859ac8732SStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 24959ac8732SStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 25059ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 25159ac8732SStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 25259ac8732SStefano Zampini mumps->schur_sizesol = sizesol; 253b5fa320bSStefano Zampini } 25459ac8732SStefano Zampini if (!mumps->sym) { 25559ac8732SStefano Zampini char type[2]; 256b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 25759ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25859ac8732SStefano Zampini sprintf(type,"N"); 259b5fa320bSStefano Zampini } else { 26059ac8732SStefano Zampini sprintf(type,"T"); 261b5fa320bSStefano Zampini } 26259ac8732SStefano Zampini } else { /* stored by columns */ 26359ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 26459ac8732SStefano Zampini sprintf(type,"T"); 26559ac8732SStefano Zampini } else { 26659ac8732SStefano Zampini sprintf(type,"N"); 26759ac8732SStefano Zampini } 26859ac8732SStefano Zampini } 26959ac8732SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_(type,"N",&B_N,&B_Nrhs,&B_N,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27059ac8732SStefano Zampini } else { 27159ac8732SStefano Zampini char ord[2]; 27259ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 27359ac8732SStefano Zampini sprintf(ord,"L"); 27459ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 27559ac8732SStefano Zampini sprintf(ord,"U"); 27659ac8732SStefano Zampini } 27759ac8732SStefano Zampini PetscStackCallBLAS("BLASsymm",BLASsymm_("L",ord,&B_N,&B_Nrhs,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27859ac8732SStefano Zampini } 279e807eca7SStefano Zampini if (sol_in_redrhs) { 28059ac8732SStefano Zampini ierr = PetscMemcpy(mumps->id.redrhs,mumps->schur_sol,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 281e807eca7SStefano Zampini } 28259ac8732SStefano Zampini } else { 28359ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 28459ac8732SStefano Zampini char type[2]; 28559ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 28659ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 28759ac8732SStefano Zampini sprintf(type,"N"); 28859ac8732SStefano Zampini } else { 28959ac8732SStefano Zampini sprintf(type,"T"); 29059ac8732SStefano Zampini } 29159ac8732SStefano Zampini } else { /* stored by columns */ 29259ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 29359ac8732SStefano Zampini sprintf(type,"T"); 29459ac8732SStefano Zampini } else { 29559ac8732SStefano Zampini sprintf(type,"N"); 29659ac8732SStefano Zampini } 29759ac8732SStefano Zampini } 29859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 29959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_(type,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 300b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 301b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRS Lapack routine %d",(int)B_ierr); 302b5fa320bSStefano Zampini } else { /* either full or lower-triangular (not packed) */ 303b5fa320bSStefano Zampini char ord[2]; 304b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 305b5fa320bSStefano Zampini sprintf(ord,"L"); 306b5fa320bSStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 307b5fa320bSStefano Zampini sprintf(ord,"U"); 308b5fa320bSStefano Zampini } 309b5fa320bSStefano Zampini if (mumps->id.sym == 2) { 310b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 31159ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 312b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 313b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRS Lapack routine %d",(int)B_ierr); 314b5fa320bSStefano Zampini } else { 315b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 31659ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 317b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 318b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRS Lapack routine %d",(int)B_ierr); 319b5fa320bSStefano Zampini } 320b5fa320bSStefano Zampini } 321e807eca7SStefano Zampini if (!sol_in_redrhs) { 322e807eca7SStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 323e807eca7SStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 324e807eca7SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 325e807eca7SStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 326e807eca7SStefano Zampini mumps->schur_sizesol = sizesol; 327e807eca7SStefano Zampini } 328e807eca7SStefano Zampini ierr = PetscMemcpy(mumps->schur_sol,mumps->id.redrhs,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 329e807eca7SStefano Zampini } 33059ac8732SStefano Zampini } 331b5fa320bSStefano Zampini PetscFunctionReturn(0); 332b5fa320bSStefano Zampini } 333b5fa320bSStefano Zampini 33459ac8732SStefano Zampini #undef __FUNCT__ 33559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsHandleSchur_Private" 336b5fa320bSStefano Zampini static PetscErrorCode MatMumpsHandleSchur_Private(Mat_MUMPS* mumps) 337b5fa320bSStefano Zampini { 338b5fa320bSStefano Zampini PetscErrorCode ierr; 339b5fa320bSStefano Zampini 340b5fa320bSStefano Zampini PetscFunctionBegin; 341b5fa320bSStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing when Schur complement has not been computed */ 342b5fa320bSStefano Zampini PetscFunctionReturn(0); 343b5fa320bSStefano Zampini } 344b5fa320bSStefano Zampini if (!mumps->schur_second_solve) { /* prepare for the condensation step */ 345b5fa320bSStefano Zampini /* check if schur complement has been computed 346e807eca7SStefano Zampini We set by default ICNTL(26) == -1 when Schur indices have been provided by the user. 347b5fa320bSStefano Zampini According to MUMPS (5.0.0) manual, any value should be harmful during the factorization phase 348b5fa320bSStefano Zampini Unless the user provides a valid value for ICNTL(26), MatSolve and MatMatSolve routines solve the full system. 349b5fa320bSStefano Zampini This requires an extra call to PetscMUMPS_c and the computation of the factors for S, handled setting double_schur_solve to PETSC_TRUE */ 350b5fa320bSStefano Zampini if (mumps->id.ICNTL(26) < 0 || mumps->id.ICNTL(26) > 2) { 351b5fa320bSStefano Zampini PetscInt sizeredrhs = mumps->id.nrhs*mumps->id.size_schur; 352b5fa320bSStefano Zampini /* allocate MUMPS internal array to store reduced right-hand sides */ 353b5fa320bSStefano Zampini if (!mumps->id.redrhs || sizeredrhs > mumps->sizeredrhs) { 354b5fa320bSStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 355b5fa320bSStefano Zampini mumps->id.lredrhs = mumps->id.size_schur; 356b5fa320bSStefano Zampini ierr = PetscMalloc1(mumps->id.nrhs*mumps->id.lredrhs,&mumps->id.redrhs);CHKERRQ(ierr); 357b5fa320bSStefano Zampini mumps->sizeredrhs = mumps->id.nrhs*mumps->id.lredrhs; 358b5fa320bSStefano Zampini } 359b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_TRUE; 360b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 1; /* condensation phase */ 361b5fa320bSStefano Zampini } 362b5fa320bSStefano Zampini } else { /* prepare for the expansion step */ 363b5fa320bSStefano Zampini /* solve Schur complement (this should be done by the MUMPS user, so basically us) */ 364e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 365b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 2; /* expansion phase */ 366b5fa320bSStefano Zampini PetscMUMPS_c(&mumps->id); 367b5fa320bSStefano Zampini if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 368b5fa320bSStefano Zampini /* restore defaults */ 369b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 370b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 371b5fa320bSStefano Zampini } 372b5fa320bSStefano Zampini PetscFunctionReturn(0); 373b5fa320bSStefano Zampini } 374b5fa320bSStefano Zampini 375397b6df1SKris Buschelman /* 376d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], col[nz], val[nz] 377d341cd04SHong Zhang 378397b6df1SKris Buschelman input: 37967877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 380397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 381bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 382bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 383397b6df1SKris Buschelman output: 384397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 385397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 386eb9baa12SBarry Smith 387eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 388eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 389eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 390eb9baa12SBarry Smith 391397b6df1SKris Buschelman */ 39216ebf90aSShri Abhyankar 39316ebf90aSShri Abhyankar #undef __FUNCT__ 39416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 395bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 396b24902e0SBarry Smith { 397185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 39867877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 399dfbe8321SBarry Smith PetscErrorCode ierr; 400c1490034SHong Zhang PetscInt *row,*col; 40116ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 402397b6df1SKris Buschelman 403397b6df1SKris Buschelman PetscFunctionBegin; 40416ebf90aSShri Abhyankar *v=aa->a; 405bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4062205254eSKarl Rupp nz = aa->nz; 4072205254eSKarl Rupp ai = aa->i; 4082205254eSKarl Rupp aj = aa->j; 40916ebf90aSShri Abhyankar *nnz = nz; 410785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 411185f6596SHong Zhang col = row + nz; 412185f6596SHong Zhang 41316ebf90aSShri Abhyankar nz = 0; 41416ebf90aSShri Abhyankar for (i=0; i<M; i++) { 41516ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 41667877ebaSShri Abhyankar ajj = aj + ai[i]; 41767877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 41867877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 41916ebf90aSShri Abhyankar } 42016ebf90aSShri Abhyankar } 42116ebf90aSShri Abhyankar *r = row; *c = col; 42216ebf90aSShri Abhyankar } 42316ebf90aSShri Abhyankar PetscFunctionReturn(0); 42416ebf90aSShri Abhyankar } 425397b6df1SKris Buschelman 42616ebf90aSShri Abhyankar #undef __FUNCT__ 42767877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 428bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 42967877ebaSShri Abhyankar { 43067877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)A->data; 43133d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 43233d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 43367877ebaSShri Abhyankar PetscErrorCode ierr; 43467877ebaSShri Abhyankar PetscInt *row,*col; 43567877ebaSShri Abhyankar 43667877ebaSShri Abhyankar PetscFunctionBegin; 43733d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 43833d57670SJed Brown M = A->rmap->N/bs; 439cf3759fdSShri Abhyankar *v = aa->a; 440bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 441cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 44267877ebaSShri Abhyankar nz = bs2*aa->nz; 44367877ebaSShri Abhyankar *nnz = nz; 444785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 445185f6596SHong Zhang col = row + nz; 446185f6596SHong Zhang 44767877ebaSShri Abhyankar for (i=0; i<M; i++) { 44867877ebaSShri Abhyankar ajj = aj + ai[i]; 44967877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 45067877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 45167877ebaSShri Abhyankar for (j=0; j<bs; j++) { 45267877ebaSShri Abhyankar for (m=0; m<bs; m++) { 45367877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 454cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 45567877ebaSShri Abhyankar } 45667877ebaSShri Abhyankar } 45767877ebaSShri Abhyankar } 45867877ebaSShri Abhyankar } 459cf3759fdSShri Abhyankar *r = row; *c = col; 46067877ebaSShri Abhyankar } 46167877ebaSShri Abhyankar PetscFunctionReturn(0); 46267877ebaSShri Abhyankar } 46367877ebaSShri Abhyankar 46467877ebaSShri Abhyankar #undef __FUNCT__ 46516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 466bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 46716ebf90aSShri Abhyankar { 46867877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 46967877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 47016ebf90aSShri Abhyankar PetscErrorCode ierr; 47116ebf90aSShri Abhyankar PetscInt *row,*col; 47216ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 47316ebf90aSShri Abhyankar 47416ebf90aSShri Abhyankar PetscFunctionBegin; 475882afa5aSHong Zhang *v = aa->a; 476bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4772205254eSKarl Rupp nz = aa->nz; 4782205254eSKarl Rupp ai = aa->i; 4792205254eSKarl Rupp aj = aa->j; 4802205254eSKarl Rupp *v = aa->a; 48116ebf90aSShri Abhyankar *nnz = nz; 482785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 483185f6596SHong Zhang col = row + nz; 484185f6596SHong Zhang 48516ebf90aSShri Abhyankar nz = 0; 48616ebf90aSShri Abhyankar for (i=0; i<M; i++) { 48716ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 48867877ebaSShri Abhyankar ajj = aj + ai[i]; 48967877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 49067877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 49116ebf90aSShri Abhyankar } 49216ebf90aSShri Abhyankar } 49316ebf90aSShri Abhyankar *r = row; *c = col; 49416ebf90aSShri Abhyankar } 49516ebf90aSShri Abhyankar PetscFunctionReturn(0); 49616ebf90aSShri Abhyankar } 49716ebf90aSShri Abhyankar 49816ebf90aSShri Abhyankar #undef __FUNCT__ 49916ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 500bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 50116ebf90aSShri Abhyankar { 50267877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 50367877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 50467877ebaSShri Abhyankar const PetscScalar *av,*v1; 50516ebf90aSShri Abhyankar PetscScalar *val; 50616ebf90aSShri Abhyankar PetscErrorCode ierr; 50716ebf90aSShri Abhyankar PetscInt *row,*col; 508829b1710SHong Zhang Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 50916ebf90aSShri Abhyankar 51016ebf90aSShri Abhyankar PetscFunctionBegin; 51116ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 51216ebf90aSShri Abhyankar adiag=aa->diag; 513bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 514829b1710SHong Zhang /* count nz in the uppper triangular part of A */ 515829b1710SHong Zhang nz = 0; 516829b1710SHong Zhang for (i=0; i<M; i++) nz += ai[i+1] - adiag[i]; 51716ebf90aSShri Abhyankar *nnz = nz; 518829b1710SHong Zhang 519185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 520185f6596SHong Zhang col = row + nz; 521185f6596SHong Zhang val = (PetscScalar*)(col + nz); 522185f6596SHong Zhang 52316ebf90aSShri Abhyankar nz = 0; 52416ebf90aSShri Abhyankar for (i=0; i<M; i++) { 52516ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 52667877ebaSShri Abhyankar ajj = aj + adiag[i]; 527cf3759fdSShri Abhyankar v1 = av + adiag[i]; 52867877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 52967877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 53016ebf90aSShri Abhyankar } 53116ebf90aSShri Abhyankar } 53216ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 533397b6df1SKris Buschelman } else { 53416ebf90aSShri Abhyankar nz = 0; val = *v; 53516ebf90aSShri Abhyankar for (i=0; i <M; i++) { 53616ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 53767877ebaSShri Abhyankar ajj = aj + adiag[i]; 53867877ebaSShri Abhyankar v1 = av + adiag[i]; 53967877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 54067877ebaSShri Abhyankar val[nz++] = v1[j]; 54116ebf90aSShri Abhyankar } 54216ebf90aSShri Abhyankar } 54316ebf90aSShri Abhyankar } 54416ebf90aSShri Abhyankar PetscFunctionReturn(0); 54516ebf90aSShri Abhyankar } 54616ebf90aSShri Abhyankar 54716ebf90aSShri Abhyankar #undef __FUNCT__ 54816ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 549bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 55016ebf90aSShri Abhyankar { 55116ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 55216ebf90aSShri Abhyankar PetscErrorCode ierr; 55316ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 55416ebf90aSShri Abhyankar PetscInt *row,*col; 55516ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 55616ebf90aSShri Abhyankar PetscScalar *val; 557397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 558397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 559397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 56016ebf90aSShri Abhyankar 56116ebf90aSShri Abhyankar PetscFunctionBegin; 562d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 563397b6df1SKris Buschelman av=aa->a; bv=bb->a; 564397b6df1SKris Buschelman 5652205254eSKarl Rupp garray = mat->garray; 5662205254eSKarl Rupp 567bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 56816ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 56916ebf90aSShri Abhyankar *nnz = nz; 570185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 571185f6596SHong Zhang col = row + nz; 572185f6596SHong Zhang val = (PetscScalar*)(col + nz); 573185f6596SHong Zhang 574397b6df1SKris Buschelman *r = row; *c = col; *v = val; 575397b6df1SKris Buschelman } else { 576397b6df1SKris Buschelman row = *r; col = *c; val = *v; 577397b6df1SKris Buschelman } 578397b6df1SKris Buschelman 579028e57e8SHong Zhang jj = 0; irow = rstart; 580397b6df1SKris Buschelman for (i=0; i<m; i++) { 581397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 582397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 583397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 584397b6df1SKris Buschelman bjj = bj + bi[i]; 58516ebf90aSShri Abhyankar v1 = av + ai[i]; 58616ebf90aSShri Abhyankar v2 = bv + bi[i]; 587397b6df1SKris Buschelman 588397b6df1SKris Buschelman /* A-part */ 589397b6df1SKris Buschelman for (j=0; j<countA; j++) { 590bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 591397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 592397b6df1SKris Buschelman } 59316ebf90aSShri Abhyankar val[jj++] = v1[j]; 594397b6df1SKris Buschelman } 59516ebf90aSShri Abhyankar 59616ebf90aSShri Abhyankar /* B-part */ 59716ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 598bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 599397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 600397b6df1SKris Buschelman } 60116ebf90aSShri Abhyankar val[jj++] = v2[j]; 60216ebf90aSShri Abhyankar } 60316ebf90aSShri Abhyankar irow++; 60416ebf90aSShri Abhyankar } 60516ebf90aSShri Abhyankar PetscFunctionReturn(0); 60616ebf90aSShri Abhyankar } 60716ebf90aSShri Abhyankar 60816ebf90aSShri Abhyankar #undef __FUNCT__ 60916ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 610bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 61116ebf90aSShri Abhyankar { 61216ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 61316ebf90aSShri Abhyankar PetscErrorCode ierr; 61416ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 61516ebf90aSShri Abhyankar PetscInt *row,*col; 61616ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 61716ebf90aSShri Abhyankar PetscScalar *val; 61816ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 61916ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 62016ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 62116ebf90aSShri Abhyankar 62216ebf90aSShri Abhyankar PetscFunctionBegin; 62316ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 62416ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 62516ebf90aSShri Abhyankar 6262205254eSKarl Rupp garray = mat->garray; 6272205254eSKarl Rupp 628bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 62916ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 63016ebf90aSShri Abhyankar *nnz = nz; 631185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 632185f6596SHong Zhang col = row + nz; 633185f6596SHong Zhang val = (PetscScalar*)(col + nz); 634185f6596SHong Zhang 63516ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 63616ebf90aSShri Abhyankar } else { 63716ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 63816ebf90aSShri Abhyankar } 63916ebf90aSShri Abhyankar 64016ebf90aSShri Abhyankar jj = 0; irow = rstart; 64116ebf90aSShri Abhyankar for (i=0; i<m; i++) { 64216ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 64316ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 64416ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 64516ebf90aSShri Abhyankar bjj = bj + bi[i]; 64616ebf90aSShri Abhyankar v1 = av + ai[i]; 64716ebf90aSShri Abhyankar v2 = bv + bi[i]; 64816ebf90aSShri Abhyankar 64916ebf90aSShri Abhyankar /* A-part */ 65016ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 651bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 65216ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 65316ebf90aSShri Abhyankar } 65416ebf90aSShri Abhyankar val[jj++] = v1[j]; 65516ebf90aSShri Abhyankar } 65616ebf90aSShri Abhyankar 65716ebf90aSShri Abhyankar /* B-part */ 65816ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 659bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 66016ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 66116ebf90aSShri Abhyankar } 66216ebf90aSShri Abhyankar val[jj++] = v2[j]; 66316ebf90aSShri Abhyankar } 66416ebf90aSShri Abhyankar irow++; 66516ebf90aSShri Abhyankar } 66616ebf90aSShri Abhyankar PetscFunctionReturn(0); 66716ebf90aSShri Abhyankar } 66816ebf90aSShri Abhyankar 66916ebf90aSShri Abhyankar #undef __FUNCT__ 67067877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij" 671bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 67267877ebaSShri Abhyankar { 67367877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 67467877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 67567877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 67667877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 677d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 67833d57670SJed Brown const PetscInt bs2=mat->bs2; 67967877ebaSShri Abhyankar PetscErrorCode ierr; 68033d57670SJed Brown PetscInt bs,nz,i,j,k,n,jj,irow,countA,countB,idx; 68167877ebaSShri Abhyankar PetscInt *row,*col; 68267877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 68367877ebaSShri Abhyankar PetscScalar *val; 68467877ebaSShri Abhyankar 68567877ebaSShri Abhyankar PetscFunctionBegin; 68633d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 687bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 68867877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 68967877ebaSShri Abhyankar *nnz = nz; 690185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 691185f6596SHong Zhang col = row + nz; 692185f6596SHong Zhang val = (PetscScalar*)(col + nz); 693185f6596SHong Zhang 69467877ebaSShri Abhyankar *r = row; *c = col; *v = val; 69567877ebaSShri Abhyankar } else { 69667877ebaSShri Abhyankar row = *r; col = *c; val = *v; 69767877ebaSShri Abhyankar } 69867877ebaSShri Abhyankar 699d985c460SShri Abhyankar jj = 0; irow = rstart; 70067877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 70167877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 70267877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 70367877ebaSShri Abhyankar ajj = aj + ai[i]; 70467877ebaSShri Abhyankar bjj = bj + bi[i]; 70567877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 70667877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 70767877ebaSShri Abhyankar 70867877ebaSShri Abhyankar idx = 0; 70967877ebaSShri Abhyankar /* A-part */ 71067877ebaSShri Abhyankar for (k=0; k<countA; k++) { 71167877ebaSShri Abhyankar for (j=0; j<bs; j++) { 71267877ebaSShri Abhyankar for (n=0; n<bs; n++) { 713bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 714d985c460SShri Abhyankar row[jj] = irow + n + shift; 715d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 71667877ebaSShri Abhyankar } 71767877ebaSShri Abhyankar val[jj++] = v1[idx++]; 71867877ebaSShri Abhyankar } 71967877ebaSShri Abhyankar } 72067877ebaSShri Abhyankar } 72167877ebaSShri Abhyankar 72267877ebaSShri Abhyankar idx = 0; 72367877ebaSShri Abhyankar /* B-part */ 72467877ebaSShri Abhyankar for (k=0; k<countB; k++) { 72567877ebaSShri Abhyankar for (j=0; j<bs; j++) { 72667877ebaSShri Abhyankar for (n=0; n<bs; n++) { 727bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 728d985c460SShri Abhyankar row[jj] = irow + n + shift; 729d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 73067877ebaSShri Abhyankar } 731d985c460SShri Abhyankar val[jj++] = v2[idx++]; 73267877ebaSShri Abhyankar } 73367877ebaSShri Abhyankar } 73467877ebaSShri Abhyankar } 735d985c460SShri Abhyankar irow += bs; 73667877ebaSShri Abhyankar } 73767877ebaSShri Abhyankar PetscFunctionReturn(0); 73867877ebaSShri Abhyankar } 73967877ebaSShri Abhyankar 74067877ebaSShri Abhyankar #undef __FUNCT__ 74116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 742bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 74316ebf90aSShri Abhyankar { 74416ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 74516ebf90aSShri Abhyankar PetscErrorCode ierr; 746e0bace9bSHong Zhang PetscInt rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 74716ebf90aSShri Abhyankar PetscInt *row,*col; 74816ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 74916ebf90aSShri Abhyankar PetscScalar *val; 75016ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 75116ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 75216ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 75316ebf90aSShri Abhyankar 75416ebf90aSShri Abhyankar PetscFunctionBegin; 75516ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 75616ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 75716ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 7582205254eSKarl Rupp 75916ebf90aSShri Abhyankar rstart = A->rmap->rstart; 76016ebf90aSShri Abhyankar 761bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 762e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 763e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 76416ebf90aSShri Abhyankar for (i=0; i<m; i++) { 765e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 76616ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 76716ebf90aSShri Abhyankar bjj = bj + bi[i]; 768e0bace9bSHong Zhang for (j=0; j<countB; j++) { 769e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 770e0bace9bSHong Zhang } 771e0bace9bSHong Zhang } 77216ebf90aSShri Abhyankar 773e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 77416ebf90aSShri Abhyankar *nnz = nz; 775185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 776185f6596SHong Zhang col = row + nz; 777185f6596SHong Zhang val = (PetscScalar*)(col + nz); 778185f6596SHong Zhang 77916ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 78016ebf90aSShri Abhyankar } else { 78116ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 78216ebf90aSShri Abhyankar } 78316ebf90aSShri Abhyankar 78416ebf90aSShri Abhyankar jj = 0; irow = rstart; 78516ebf90aSShri Abhyankar for (i=0; i<m; i++) { 78616ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 78716ebf90aSShri Abhyankar v1 = av + adiag[i]; 78816ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 78916ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 79016ebf90aSShri Abhyankar bjj = bj + bi[i]; 79116ebf90aSShri Abhyankar v2 = bv + bi[i]; 79216ebf90aSShri Abhyankar 79316ebf90aSShri Abhyankar /* A-part */ 79416ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 795bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 79616ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 79716ebf90aSShri Abhyankar } 79816ebf90aSShri Abhyankar val[jj++] = v1[j]; 79916ebf90aSShri Abhyankar } 80016ebf90aSShri Abhyankar 80116ebf90aSShri Abhyankar /* B-part */ 80216ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 80316ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 804bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 80516ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 80616ebf90aSShri Abhyankar } 80716ebf90aSShri Abhyankar val[jj++] = v2[j]; 80816ebf90aSShri Abhyankar } 809397b6df1SKris Buschelman } 810397b6df1SKris Buschelman irow++; 811397b6df1SKris Buschelman } 812397b6df1SKris Buschelman PetscFunctionReturn(0); 813397b6df1SKris Buschelman } 814397b6df1SKris Buschelman 815397b6df1SKris Buschelman #undef __FUNCT__ 81620be8e61SHong Zhang #define __FUNCT__ "MatGetDiagonal_MUMPS" 81720be8e61SHong Zhang PetscErrorCode MatGetDiagonal_MUMPS(Mat A,Vec v) 81820be8e61SHong Zhang { 81920be8e61SHong Zhang PetscFunctionBegin; 82020be8e61SHong Zhang SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Mat type: MUMPS factor"); 82120be8e61SHong Zhang PetscFunctionReturn(0); 82220be8e61SHong Zhang } 82320be8e61SHong Zhang 82420be8e61SHong Zhang #undef __FUNCT__ 8253924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 826dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A) 827dfbe8321SBarry Smith { 828a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 829dfbe8321SBarry Smith PetscErrorCode ierr; 830b24902e0SBarry Smith 831397b6df1SKris Buschelman PetscFunctionBegin; 832a5e57a09SHong Zhang if (mumps->CleanUpMUMPS) { 833397b6df1SKris Buschelman /* Terminate instance, deallocate memories */ 834a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 835a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 836a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 837801fbe65SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 838a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 839a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 840a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 841b34f08ffSHong Zhang ierr = PetscFree(mumps->info);CHKERRQ(ierr); 84259ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 843a5e57a09SHong Zhang mumps->id.job = JOB_END; 844a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 845a5e57a09SHong Zhang ierr = MPI_Comm_free(&(mumps->comm_mumps));CHKERRQ(ierr); 846397b6df1SKris Buschelman } 847a5e57a09SHong Zhang if (mumps->Destroy) { 848a5e57a09SHong Zhang ierr = (mumps->Destroy)(A);CHKERRQ(ierr); 849bf0cc555SLisandro Dalcin } 850bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 851bf0cc555SLisandro Dalcin 85297969023SHong Zhang /* clear composed functions */ 853bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 854bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 855bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetIcntl_C",NULL);CHKERRQ(ierr); 856bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 857bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetCntl_C",NULL);CHKERRQ(ierr); 858bc6112feSHong Zhang 859ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfo_C",NULL);CHKERRQ(ierr); 860ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfog_C",NULL);CHKERRQ(ierr); 861ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfo_C",NULL);CHKERRQ(ierr); 862ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfog_C",NULL);CHKERRQ(ierr); 8636444a565SStefano Zampini 8646444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetSchurIndices_C",NULL);CHKERRQ(ierr); 86559ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsInvertSchurComplement_C",NULL);CHKERRQ(ierr); 86659ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsCreateSchurComplement_C",NULL);CHKERRQ(ierr); 8676444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetSchurComplement_C",NULL);CHKERRQ(ierr); 86859ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsRestoreSchurComplement_C",NULL);CHKERRQ(ierr); 869e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSolveSchurComplement_C",NULL);CHKERRQ(ierr); 870*7404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSolveSchurComplementTranspose_C",NULL);CHKERRQ(ierr); 871397b6df1SKris Buschelman PetscFunctionReturn(0); 872397b6df1SKris Buschelman } 873397b6df1SKris Buschelman 874397b6df1SKris Buschelman #undef __FUNCT__ 875f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 876b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 877b24902e0SBarry Smith { 878a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 879d54de34fSKris Buschelman PetscScalar *array; 88067877ebaSShri Abhyankar Vec b_seq; 881329ec9b3SHong Zhang IS is_iden,is_petsc; 882dfbe8321SBarry Smith PetscErrorCode ierr; 883329ec9b3SHong Zhang PetscInt i; 884883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 885397b6df1SKris Buschelman 886397b6df1SKris Buschelman PetscFunctionBegin; 887883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 888883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 889a5e57a09SHong Zhang mumps->id.nrhs = 1; 890a5e57a09SHong Zhang b_seq = mumps->b_seq; 891a5e57a09SHong Zhang if (mumps->size > 1) { 892329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */ 893a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 894a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 895a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 896397b6df1SKris Buschelman } else { /* size == 1 */ 897397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 898397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 899397b6df1SKris Buschelman } 900a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 901a5e57a09SHong Zhang mumps->id.nrhs = 1; 902940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 903397b6df1SKris Buschelman } 904397b6df1SKris Buschelman 905b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 906b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 907b5fa320bSStefano Zampini 908397b6df1SKris Buschelman /* solve phase */ 909329ec9b3SHong Zhang /*-------------*/ 910a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 911a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 912a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 913397b6df1SKris Buschelman 914b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 915b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 916b5fa320bSStefano Zampini 917a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 918a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 919a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 920a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 921397b6df1SKris Buschelman } 922a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 923a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 924a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 925a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 926a5e57a09SHong Zhang } 927a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 928a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 9296bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9306bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 9312205254eSKarl Rupp 932a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 933397b6df1SKris Buschelman } 934a5e57a09SHong Zhang 935a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 936a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 937329ec9b3SHong Zhang } 938397b6df1SKris Buschelman PetscFunctionReturn(0); 939397b6df1SKris Buschelman } 940397b6df1SKris Buschelman 94151d5961aSHong Zhang #undef __FUNCT__ 94251d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 94351d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 94451d5961aSHong Zhang { 945a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 94651d5961aSHong Zhang PetscErrorCode ierr; 94751d5961aSHong Zhang 94851d5961aSHong Zhang PetscFunctionBegin; 949a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 9500ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 951a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 95251d5961aSHong Zhang PetscFunctionReturn(0); 95351d5961aSHong Zhang } 95451d5961aSHong Zhang 955e0b74bf9SHong Zhang #undef __FUNCT__ 956e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 957e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 958e0b74bf9SHong Zhang { 959bda8bf91SBarry Smith PetscErrorCode ierr; 960bda8bf91SBarry Smith PetscBool flg; 9614e34a73bSHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 962334c5f61SHong Zhang PetscInt i,nrhs,M; 9632cd7d884SHong Zhang PetscScalar *array,*bray; 964bda8bf91SBarry Smith 965e0b74bf9SHong Zhang PetscFunctionBegin; 9660298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 967801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 9680298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 969801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 970801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 9714e34a73bSHong Zhang 9722cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 973334c5f61SHong Zhang mumps->id.nrhs = nrhs; 974334c5f61SHong Zhang mumps->id.lrhs = M; 9754e34a73bSHong Zhang 9762cd7d884SHong Zhang if (mumps->size == 1) { 9772cd7d884SHong Zhang /* copy B to X */ 9782cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 9792cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 9806444a565SStefano Zampini ierr = PetscMemcpy(array,bray,M*nrhs*sizeof(PetscScalar));CHKERRQ(ierr); 9812cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 982940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 983b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 984b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 985801fbe65SHong Zhang 9862cd7d884SHong Zhang /* solve phase */ 9872cd7d884SHong Zhang /*-------------*/ 9882cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 9892cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 9902cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 991b5fa320bSStefano Zampini 992b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 993b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 9942cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 995334c5f61SHong Zhang } else { /*--------- parallel case --------*/ 99671aed81dSHong Zhang PetscInt lsol_loc,nlsol_loc,*isol_loc,*idx,*iidx,*idxx,*isol_loc_save; 9971070efccSSatish Balay MumpsScalar *sol_loc,*sol_loc_save; 998801fbe65SHong Zhang IS is_to,is_from; 999334c5f61SHong Zhang PetscInt k,proc,j,m; 1000801fbe65SHong Zhang const PetscInt *rstart; 1001334c5f61SHong Zhang Vec v_mpi,b_seq,x_seq; 1002334c5f61SHong Zhang VecScatter scat_rhs,scat_sol; 1003801fbe65SHong Zhang 1004801fbe65SHong Zhang /* create x_seq to hold local solution */ 100571aed81dSHong Zhang isol_loc_save = mumps->id.isol_loc; /* save it for MatSovle() */ 100671aed81dSHong Zhang sol_loc_save = mumps->id.sol_loc; 1007801fbe65SHong Zhang 100871aed81dSHong Zhang lsol_loc = mumps->id.INFO(23); 100971aed81dSHong Zhang nlsol_loc = nrhs*lsol_loc; /* length of sol_loc */ 101071aed81dSHong Zhang ierr = PetscMalloc2(nlsol_loc,&sol_loc,nlsol_loc,&isol_loc);CHKERRQ(ierr); 1011940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1012801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 1013801fbe65SHong Zhang 10141070efccSSatish Balay ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,nlsol_loc,(PetscScalar*)sol_loc,&x_seq);CHKERRQ(ierr); 10152cd7d884SHong Zhang 101674f0fcc7SHong Zhang /* copy rhs matrix B into vector v_mpi */ 1017334c5f61SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 1018801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 101974f0fcc7SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&v_mpi);CHKERRQ(ierr); 1020801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 1021801fbe65SHong Zhang 1022334c5f61SHong Zhang /* scatter v_mpi to b_seq because MUMPS only supports centralized rhs */ 102374f0fcc7SHong Zhang /* idx: maps from k-th index of v_mpi to (i,j)-th global entry of B; 1024801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 1025801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 1026801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 1027801fbe65SHong Zhang k = 0; 1028801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 1029801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 1030801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 1031801fbe65SHong Zhang iidx[j*M + i] = k; 1032801fbe65SHong Zhang idx[k++] = j*M + i; 1033801fbe65SHong Zhang } 1034801fbe65SHong Zhang } 10352cd7d884SHong Zhang } 10362cd7d884SHong Zhang 1037801fbe65SHong Zhang if (!mumps->myid) { 1038334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&b_seq);CHKERRQ(ierr); 1039801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1040801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 1041801fbe65SHong Zhang } else { 1042334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&b_seq);CHKERRQ(ierr); 1043801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 1044801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 1045801fbe65SHong Zhang } 1046334c5f61SHong Zhang ierr = VecScatterCreate(v_mpi,is_from,b_seq,is_to,&scat_rhs);CHKERRQ(ierr); 1047334c5f61SHong Zhang ierr = VecScatterBegin(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1048801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1049801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1050334c5f61SHong Zhang ierr = VecScatterEnd(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1051801fbe65SHong Zhang 1052801fbe65SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 1053334c5f61SHong Zhang ierr = VecGetArray(b_seq,&bray);CHKERRQ(ierr); 1054940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)bray; 1055334c5f61SHong Zhang ierr = VecRestoreArray(b_seq,&bray);CHKERRQ(ierr); 1056801fbe65SHong Zhang } 1057801fbe65SHong Zhang 1058801fbe65SHong Zhang /* solve phase */ 1059801fbe65SHong Zhang /*-------------*/ 1060801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 1061801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 1062801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 1063801fbe65SHong Zhang 1064334c5f61SHong Zhang /* scatter mumps distributed solution to petsc vector v_mpi, which shares local arrays with solution matrix X */ 106574f0fcc7SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 106674f0fcc7SHong Zhang ierr = VecPlaceArray(v_mpi,array);CHKERRQ(ierr); 1067801fbe65SHong Zhang 1068334c5f61SHong Zhang /* create scatter scat_sol */ 106971aed81dSHong Zhang ierr = PetscMalloc1(nlsol_loc,&idxx);CHKERRQ(ierr); 107071aed81dSHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nlsol_loc,0,1,&is_from);CHKERRQ(ierr); 107171aed81dSHong Zhang for (i=0; i<lsol_loc; i++) { 1072334c5f61SHong Zhang isol_loc[i] -= 1; /* change Fortran style to C style */ 1073334c5f61SHong Zhang idxx[i] = iidx[isol_loc[i]]; 1074801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 1075334c5f61SHong Zhang idxx[j*lsol_loc+i] = iidx[isol_loc[i]+j*M]; 1076801fbe65SHong Zhang } 1077801fbe65SHong Zhang } 107871aed81dSHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nlsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1079334c5f61SHong Zhang ierr = VecScatterCreate(x_seq,is_from,v_mpi,is_to,&scat_sol);CHKERRQ(ierr); 1080334c5f61SHong Zhang ierr = VecScatterBegin(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1081801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1082801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1083334c5f61SHong Zhang ierr = VecScatterEnd(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1084801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 108571aed81dSHong Zhang 108671aed81dSHong Zhang /* free spaces */ 108771aed81dSHong Zhang mumps->id.sol_loc = sol_loc_save; 108871aed81dSHong Zhang mumps->id.isol_loc = isol_loc_save; 108971aed81dSHong Zhang 109071aed81dSHong Zhang ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 1091801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 1092801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 109371aed81dSHong Zhang ierr = VecDestroy(&x_seq);CHKERRQ(ierr); 109474f0fcc7SHong Zhang ierr = VecDestroy(&v_mpi);CHKERRQ(ierr); 1095334c5f61SHong Zhang ierr = VecDestroy(&b_seq);CHKERRQ(ierr); 1096334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_rhs);CHKERRQ(ierr); 1097334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_sol);CHKERRQ(ierr); 1098801fbe65SHong Zhang } 1099e0b74bf9SHong Zhang PetscFunctionReturn(0); 1100e0b74bf9SHong Zhang } 1101e0b74bf9SHong Zhang 1102ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 1103a58c3f20SHong Zhang /* 1104a58c3f20SHong Zhang input: 1105a58c3f20SHong Zhang F: numeric factor 1106a58c3f20SHong Zhang output: 1107a58c3f20SHong Zhang nneg: total number of negative pivots 1108a58c3f20SHong Zhang nzero: 0 1109a58c3f20SHong Zhang npos: (global dimension of F) - nneg 1110a58c3f20SHong Zhang */ 1111a58c3f20SHong Zhang 1112a58c3f20SHong Zhang #undef __FUNCT__ 1113a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 1114dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 1115a58c3f20SHong Zhang { 1116a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1117dfbe8321SBarry Smith PetscErrorCode ierr; 1118c1490034SHong Zhang PetscMPIInt size; 1119a58c3f20SHong Zhang 1120a58c3f20SHong Zhang PetscFunctionBegin; 1121ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 1122bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 1123a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 1124ed85ac9fSHong Zhang 1125710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 1126ed85ac9fSHong Zhang if (nzero || npos) { 1127ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 1128710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 1129710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 1130a58c3f20SHong Zhang } 1131a58c3f20SHong Zhang PetscFunctionReturn(0); 1132a58c3f20SHong Zhang } 1133ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 1134a58c3f20SHong Zhang 1135397b6df1SKris Buschelman #undef __FUNCT__ 1136f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 11370481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 1138af281ebdSHong Zhang { 1139a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 11406849ba73SBarry Smith PetscErrorCode ierr; 1141e09efc27SHong Zhang Mat F_diag; 1142ace3abfcSBarry Smith PetscBool isMPIAIJ; 1143397b6df1SKris Buschelman 1144397b6df1SKris Buschelman PetscFunctionBegin; 1145a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1146397b6df1SKris Buschelman 1147397b6df1SKris Buschelman /* numerical factorization phase */ 1148329ec9b3SHong Zhang /*-------------------------------*/ 1149a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 11504e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 1151a5e57a09SHong Zhang if (!mumps->myid) { 1152940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 1153397b6df1SKris Buschelman } 1154397b6df1SKris Buschelman } else { 1155940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 1156397b6df1SKris Buschelman } 1157a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1158a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 1159151787a6SHong Zhang if (mumps->id.INFO(1) == -13) { 1160151787a6SHong Zhang if (mumps->id.INFO(2) < 0) { 1161151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",-mumps->id.INFO(2)); 1162151787a6SHong Zhang } else { 1163151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d bytes\n",mumps->id.INFO(2)); 1164151787a6SHong Zhang } 1165151787a6SHong Zhang } else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 1166397b6df1SKris Buschelman } 1167a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 1168397b6df1SKris Buschelman 1169dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 1170a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 1171a5e57a09SHong Zhang mumps->CleanUpMUMPS = PETSC_TRUE; 1172b5fa320bSStefano Zampini mumps->schur_factored = PETSC_FALSE; 117359ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 117467877ebaSShri Abhyankar 1175066565c5SStefano Zampini /* just to be sure that ICNTL(19) value returned by a call from MatMumpsGetIcntl is always consistent */ 1176066565c5SStefano Zampini if (!mumps->sym && mumps->id.ICNTL(19) && mumps->id.ICNTL(19) != 1) mumps->id.ICNTL(19) = 3; 1177066565c5SStefano Zampini 1178a5e57a09SHong Zhang if (mumps->size > 1) { 117967877ebaSShri Abhyankar PetscInt lsol_loc; 118067877ebaSShri Abhyankar PetscScalar *sol_loc; 11812205254eSKarl Rupp 1182c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 1183c2093ab7SHong Zhang if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 1184c2093ab7SHong Zhang else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 1185c2093ab7SHong Zhang F_diag->assembled = PETSC_TRUE; 1186c2093ab7SHong Zhang 1187c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 1188c2093ab7SHong Zhang if (mumps->x_seq) { 1189c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 1190c2093ab7SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 1191c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 1192c2093ab7SHong Zhang } 1193a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 1194dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 1195a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 1196940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1197a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 119867877ebaSShri Abhyankar } 1199397b6df1SKris Buschelman PetscFunctionReturn(0); 1200397b6df1SKris Buschelman } 1201397b6df1SKris Buschelman 12029a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 1203dcd589f8SShri Abhyankar #undef __FUNCT__ 12049a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 12059a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 1206dcd589f8SShri Abhyankar { 12079a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1208dcd589f8SShri Abhyankar PetscErrorCode ierr; 1209b34f08ffSHong Zhang PetscInt icntl,info[40],i,ninfo=40; 1210ace3abfcSBarry Smith PetscBool flg; 1211dcd589f8SShri Abhyankar 1212dcd589f8SShri Abhyankar PetscFunctionBegin; 1213ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 12149a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 12159a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 12169a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 12179a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 12189a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 12199a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 1220dcd589f8SShri Abhyankar 12219a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 12229a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 12239a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 12249a2535b5SHong Zhang 1225d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 12269a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 12279a2535b5SHong Zhang 1228d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 1229dcd589f8SShri Abhyankar if (flg) { 12302205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 12312205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 1232dcd589f8SShri Abhyankar } 1233e0b74bf9SHong Zhang 12340298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 1235d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 12360298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 1237d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 1238d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 1239d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 1240d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 1241d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 124259ac8732SStefano Zampini if (mumps->id.ICNTL(19) <= 0 || mumps->id.ICNTL(19) > 3) { /* reset any schur data (if any) */ 124359ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 124459ac8732SStefano Zampini } 12454e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 1246d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 12479a2535b5SHong Zhang 1248d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 12490298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 12500298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 12519a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 12529a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 1253d7ebd59bSHong Zhang } 1254d7ebd59bSHong Zhang 1255d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 1256d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 12572cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 12580298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 1259d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 12600298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 1261d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 12624e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 12630298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1264dcd589f8SShri Abhyankar 12650298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 12660298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 12670298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 12680298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 12690298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1270e5bb22a1SHong Zhang 12710298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1272b34f08ffSHong Zhang 127316d797efSHong Zhang ierr = PetscOptionsIntArray("-mat_mumps_view_info","request INFO local to each processor","",info,&ninfo,NULL);CHKERRQ(ierr); 1274b34f08ffSHong Zhang if (ninfo) { 1275b34f08ffSHong Zhang if (ninfo > 40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"number of INFO %d must <= 40\n",ninfo); 1276b34f08ffSHong Zhang ierr = PetscMalloc1(ninfo,&mumps->info);CHKERRQ(ierr); 1277b34f08ffSHong Zhang mumps->ninfo = ninfo; 1278b34f08ffSHong Zhang for (i=0; i<ninfo; i++) { 1279b34f08ffSHong Zhang if (info[i] < 0 || info[i]>40) { 1280b34f08ffSHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"index of INFO %d must between 1 and 40\n",ninfo); 1281b34f08ffSHong Zhang } else { 1282b34f08ffSHong Zhang mumps->info[i] = info[i]; 1283b34f08ffSHong Zhang } 1284b34f08ffSHong Zhang } 1285b34f08ffSHong Zhang } 1286b34f08ffSHong Zhang 1287dcd589f8SShri Abhyankar PetscOptionsEnd(); 1288dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1289dcd589f8SShri Abhyankar } 1290dcd589f8SShri Abhyankar 1291dcd589f8SShri Abhyankar #undef __FUNCT__ 1292dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1293f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1294dcd589f8SShri Abhyankar { 1295dcd589f8SShri Abhyankar PetscErrorCode ierr; 1296dcd589f8SShri Abhyankar 1297dcd589f8SShri Abhyankar PetscFunctionBegin; 1298ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1299ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1300ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 13012205254eSKarl Rupp 1302f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1303f697e70eSHong Zhang 1304f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1305f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1306f697e70eSHong Zhang mumps->id.sym = mumps->sym; 13072907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1308f697e70eSHong Zhang 1309f697e70eSHong Zhang mumps->CleanUpMUMPS = PETSC_FALSE; 13100298fd71SBarry Smith mumps->scat_rhs = NULL; 13110298fd71SBarry Smith mumps->scat_sol = NULL; 13129a2535b5SHong Zhang 131370544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 13149a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 13159a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 13169a2535b5SHong Zhang if (mumps->size == 1) { 13179a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 13189a2535b5SHong Zhang } else { 13199a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 13204e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 132170544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 13229a2535b5SHong Zhang } 13236444a565SStefano Zampini 13246444a565SStefano Zampini /* schur */ 13256444a565SStefano Zampini mumps->id.size_schur = 0; 13266444a565SStefano Zampini mumps->id.listvar_schur = NULL; 13276444a565SStefano Zampini mumps->id.schur = NULL; 1328b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 1329b5fa320bSStefano Zampini mumps->sizeredrhs = 0; 1330b5fa320bSStefano Zampini mumps->schur_pivots = NULL; 1331b5fa320bSStefano Zampini mumps->schur_work = NULL; 133259ac8732SStefano Zampini mumps->schur_sol = NULL; 133359ac8732SStefano Zampini mumps->schur_sizesol = 0; 133459ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 133559ac8732SStefano Zampini mumps->schur_factored = PETSC_FALSE; 133659ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 1337dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1338dcd589f8SShri Abhyankar } 1339dcd589f8SShri Abhyankar 1340a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1341397b6df1SKris Buschelman #undef __FUNCT__ 1342f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 13430481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1344b24902e0SBarry Smith { 1345a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1346dcd589f8SShri Abhyankar PetscErrorCode ierr; 134767877ebaSShri Abhyankar Vec b; 134867877ebaSShri Abhyankar IS is_iden; 134967877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1350397b6df1SKris Buschelman 1351397b6df1SKris Buschelman PetscFunctionBegin; 1352a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1353dcd589f8SShri Abhyankar 13549a2535b5SHong Zhang /* Set MUMPS options from the options database */ 13559a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1356dcd589f8SShri Abhyankar 1357a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1358dcd589f8SShri Abhyankar 135967877ebaSShri Abhyankar /* analysis phase */ 136067877ebaSShri Abhyankar /*----------------*/ 1361a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1362a5e57a09SHong Zhang mumps->id.n = M; 1363a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 136467877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1365a5e57a09SHong Zhang if (!mumps->myid) { 1366a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1367a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1368940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 136967877ebaSShri Abhyankar } 1370a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 13715248a706SHong Zhang /* 13725248a706SHong Zhang PetscBool flag; 13735248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 13745248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 13755248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 13765248a706SHong Zhang */ 1377a5e57a09SHong Zhang if (!mumps->myid) { 1378e0b74bf9SHong Zhang const PetscInt *idx; 1379e0b74bf9SHong Zhang PetscInt i,*perm_in; 13802205254eSKarl Rupp 1381785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1382e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 13832205254eSKarl Rupp 1384a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1385e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */ 1386e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1387e0b74bf9SHong Zhang } 1388e0b74bf9SHong Zhang } 138967877ebaSShri Abhyankar } 139067877ebaSShri Abhyankar break; 139167877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1392a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1393a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1394a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1395940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 139667877ebaSShri Abhyankar } 139767877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1398a5e57a09SHong Zhang if (!mumps->myid) { 13992cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 14002cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 140167877ebaSShri Abhyankar } else { 1402a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 140367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 140467877ebaSShri Abhyankar } 14052a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1406a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14076bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14086bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 140967877ebaSShri Abhyankar break; 141067877ebaSShri Abhyankar } 1411a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1412a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 141367877ebaSShri Abhyankar 1414719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1415dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 141651d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 14174e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1418b24902e0SBarry Smith PetscFunctionReturn(0); 1419b24902e0SBarry Smith } 1420b24902e0SBarry Smith 1421450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1422450b117fSShri Abhyankar #undef __FUNCT__ 1423450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 1424450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1425450b117fSShri Abhyankar { 1426a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1427dcd589f8SShri Abhyankar PetscErrorCode ierr; 142867877ebaSShri Abhyankar Vec b; 142967877ebaSShri Abhyankar IS is_iden; 143067877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1431450b117fSShri Abhyankar 1432450b117fSShri Abhyankar PetscFunctionBegin; 1433a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1434dcd589f8SShri Abhyankar 14359a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14369a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1437dcd589f8SShri Abhyankar 1438a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 143967877ebaSShri Abhyankar 144067877ebaSShri Abhyankar /* analysis phase */ 144167877ebaSShri Abhyankar /*----------------*/ 1442a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1443a5e57a09SHong Zhang mumps->id.n = M; 1444a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 144567877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1446a5e57a09SHong Zhang if (!mumps->myid) { 1447a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1448a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1449940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 145067877ebaSShri Abhyankar } 145167877ebaSShri Abhyankar } 145267877ebaSShri Abhyankar break; 145367877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1454a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1455a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1456a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1457940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 145867877ebaSShri Abhyankar } 145967877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1460a5e57a09SHong Zhang if (!mumps->myid) { 1461a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 146267877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 146367877ebaSShri Abhyankar } else { 1464a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 146567877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 146667877ebaSShri Abhyankar } 14672a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1468a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14696bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14706bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 147167877ebaSShri Abhyankar break; 147267877ebaSShri Abhyankar } 1473a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1474a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 147567877ebaSShri Abhyankar 1476450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1477dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 147851d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1479450b117fSShri Abhyankar PetscFunctionReturn(0); 1480450b117fSShri Abhyankar } 1481b24902e0SBarry Smith 1482141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1483397b6df1SKris Buschelman #undef __FUNCT__ 148467877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 148567877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1486b24902e0SBarry Smith { 1487a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1488dcd589f8SShri Abhyankar PetscErrorCode ierr; 148967877ebaSShri Abhyankar Vec b; 149067877ebaSShri Abhyankar IS is_iden; 149167877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1492397b6df1SKris Buschelman 1493397b6df1SKris Buschelman PetscFunctionBegin; 1494a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1495dcd589f8SShri Abhyankar 14969a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14979a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1498dcd589f8SShri Abhyankar 1499a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1500dcd589f8SShri Abhyankar 150167877ebaSShri Abhyankar /* analysis phase */ 150267877ebaSShri Abhyankar /*----------------*/ 1503a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1504a5e57a09SHong Zhang mumps->id.n = M; 1505a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 150667877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1507a5e57a09SHong Zhang if (!mumps->myid) { 1508a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1509a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1510940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 151167877ebaSShri Abhyankar } 151267877ebaSShri Abhyankar } 151367877ebaSShri Abhyankar break; 151467877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1515a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1516a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1517a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1518940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 151967877ebaSShri Abhyankar } 152067877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1521a5e57a09SHong Zhang if (!mumps->myid) { 1522a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 152367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 152467877ebaSShri Abhyankar } else { 1525a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 152667877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 152767877ebaSShri Abhyankar } 15282a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1529a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 15306bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 15316bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 153267877ebaSShri Abhyankar break; 153367877ebaSShri Abhyankar } 1534a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1535a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 153667877ebaSShri Abhyankar 15372792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1538dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 153951d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 15404e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 15414e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 15420298fd71SBarry Smith F->ops->getinertia = NULL; 15434e34a73bSHong Zhang #else 15444e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1545db4efbfdSBarry Smith #endif 1546b24902e0SBarry Smith PetscFunctionReturn(0); 1547b24902e0SBarry Smith } 1548b24902e0SBarry Smith 1549397b6df1SKris Buschelman #undef __FUNCT__ 155064e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 155164e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 155274ed9c26SBarry Smith { 1553f6c57405SHong Zhang PetscErrorCode ierr; 155464e6c443SBarry Smith PetscBool iascii; 155564e6c443SBarry Smith PetscViewerFormat format; 1556a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1557f6c57405SHong Zhang 1558f6c57405SHong Zhang PetscFunctionBegin; 155964e6c443SBarry Smith /* check if matrix is mumps type */ 156064e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 156164e6c443SBarry Smith 1562251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 156364e6c443SBarry Smith if (iascii) { 156464e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 156564e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 156664e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1567a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1568a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1569a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1570a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1571a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1572a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1573a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1574a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1575a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1576a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1577a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1578a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1579a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1580a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1581a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1582a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1583a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1584a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1585a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1586f6c57405SHong Zhang } 1587a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1588a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1589a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1590f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1591a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1592a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1593a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1594ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (solution struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1595a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1596a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1597c0165424SHong Zhang 1598a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1599a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1600a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1601a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1602a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1603a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr); 160442179a6aSHong Zhang 1605a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1606a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1607a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1608f6c57405SHong Zhang 1609a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1610a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1611ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absolute pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1612ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (value of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1613a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1614f6c57405SHong Zhang 1615f6c57405SHong Zhang /* infomation local to each processor */ 161634ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 16177b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 1618a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 161934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 162034ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1621a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 162234ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 162334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1624a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 162534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1626f6c57405SHong Zhang 162734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1628a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 162934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1630f6c57405SHong Zhang 163134ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1632a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 163334ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1634f6c57405SHong Zhang 163534ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1636a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 163734ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1638b34f08ffSHong Zhang 1639b34f08ffSHong Zhang if (mumps->ninfo && mumps->ninfo <= 40){ 1640b34f08ffSHong Zhang PetscInt i; 1641b34f08ffSHong Zhang for (i=0; i<mumps->ninfo; i++){ 1642b34f08ffSHong Zhang ierr = PetscViewerASCIIPrintf(viewer, " INFO(%d): \n",mumps->info[i]);CHKERRQ(ierr); 1643b34f08ffSHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(mumps->info[i]));CHKERRQ(ierr); 1644b34f08ffSHong Zhang ierr = PetscViewerFlush(viewer); 1645b34f08ffSHong Zhang } 1646b34f08ffSHong Zhang } 1647b34f08ffSHong Zhang 1648b34f08ffSHong Zhang 16497b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 1650f6c57405SHong Zhang 1651a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1652a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1653a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1654a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1655a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1656f6c57405SHong Zhang 1657a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1658a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1659a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1660a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1661a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1662a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1663a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1664a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1665a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1666a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1667a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1668a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1669a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1670a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1671a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1672a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1673a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1674a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1675a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1676a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1677a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1678a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1679a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 168040d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 168140d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 168240d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(30, 31) (after solution: size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 168340d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 168440d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 168540d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1686f6c57405SHong Zhang } 1687f6c57405SHong Zhang } 1688cb828f0fSHong Zhang } 1689f6c57405SHong Zhang PetscFunctionReturn(0); 1690f6c57405SHong Zhang } 1691f6c57405SHong Zhang 169235bd34faSBarry Smith #undef __FUNCT__ 169335bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 169435bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 169535bd34faSBarry Smith { 1696cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 169735bd34faSBarry Smith 169835bd34faSBarry Smith PetscFunctionBegin; 169935bd34faSBarry Smith info->block_size = 1.0; 1700cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1701cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 170235bd34faSBarry Smith info->nz_unneeded = 0.0; 170335bd34faSBarry Smith info->assemblies = 0.0; 170435bd34faSBarry Smith info->mallocs = 0.0; 170535bd34faSBarry Smith info->memory = 0.0; 170635bd34faSBarry Smith info->fill_ratio_given = 0; 170735bd34faSBarry Smith info->fill_ratio_needed = 0; 170835bd34faSBarry Smith info->factor_mallocs = 0; 170935bd34faSBarry Smith PetscFunctionReturn(0); 171035bd34faSBarry Smith } 171135bd34faSBarry Smith 17125ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 17135ccb76cbSHong Zhang #undef __FUNCT__ 17146444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices_MUMPS" 17156444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices_MUMPS(Mat F,PetscInt size,PetscInt idxs[]) 17166444a565SStefano Zampini { 17176444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17186444a565SStefano Zampini PetscErrorCode ierr; 17196444a565SStefano Zampini 17206444a565SStefano Zampini PetscFunctionBegin; 172159ac8732SStefano Zampini if (mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MUMPS parallel Schur complements not yet supported from PETSc\n"); 17226444a565SStefano Zampini if (mumps->id.size_schur != size) { 17236444a565SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 17246444a565SStefano Zampini mumps->id.size_schur = size; 17256444a565SStefano Zampini mumps->id.schur_lld = size; 17266444a565SStefano Zampini ierr = PetscMalloc2(size,&mumps->id.listvar_schur,size*size,&mumps->id.schur);CHKERRQ(ierr); 17276444a565SStefano Zampini } 17286444a565SStefano Zampini ierr = PetscMemcpy(mumps->id.listvar_schur,idxs,size*sizeof(PetscInt));CHKERRQ(ierr); 17296444a565SStefano Zampini if (F->factortype == MAT_FACTOR_LU) { 173059ac8732SStefano Zampini mumps->id.ICNTL(19) = 3; /* MUMPS returns full matrix */ 17316444a565SStefano Zampini } else { 173259ac8732SStefano Zampini mumps->id.ICNTL(19) = 2; /* MUMPS returns lower triangular part */ 17336444a565SStefano Zampini } 173459ac8732SStefano Zampini /* set a special value of ICNTL (not handled my MUMPS) to be used in the solve phase by PETSc */ 1735b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 17366444a565SStefano Zampini PetscFunctionReturn(0); 17376444a565SStefano Zampini } 17386444a565SStefano Zampini 17396444a565SStefano Zampini #undef __FUNCT__ 17406444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices" 17416444a565SStefano Zampini /*@ 17426444a565SStefano Zampini MatMumpsSetSchurIndices - Set indices defining the Schur complement that MUMPS will compute during the factorization steps 17436444a565SStefano Zampini 17446444a565SStefano Zampini Logically Collective on Mat 17456444a565SStefano Zampini 17466444a565SStefano Zampini Input Parameters: 17476444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 17486444a565SStefano Zampini . size - size of the Schur complement indices 17496444a565SStefano Zampini - idxs[] - array of Schur complement indices 17506444a565SStefano Zampini 17516444a565SStefano Zampini Notes: 175259ac8732SStefano Zampini The user has to free the array idxs[] since the indices are copied by the routine. 175359ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 17546444a565SStefano Zampini 17556444a565SStefano Zampini Level: advanced 17566444a565SStefano Zampini 17576444a565SStefano Zampini References: MUMPS Users' Guide 17586444a565SStefano Zampini 175959ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsCreateSchurComplement(), MatMumpsGetSchurComplement() 17606444a565SStefano Zampini @*/ 17616444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices(Mat F,PetscInt size,PetscInt idxs[]) 17626444a565SStefano Zampini { 17636444a565SStefano Zampini PetscErrorCode ierr; 17646444a565SStefano Zampini 17656444a565SStefano Zampini PetscFunctionBegin; 1766e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 1767e807eca7SStefano Zampini if (size) PetscValidIntPointer(idxs,3); 17686444a565SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsSetSchurIndices_C",(Mat,PetscInt,PetscInt[]),(F,size,idxs));CHKERRQ(ierr); 17696444a565SStefano Zampini PetscFunctionReturn(0); 17706444a565SStefano Zampini } 177159ac8732SStefano Zampini 17726444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 17736444a565SStefano Zampini #undef __FUNCT__ 177459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement_MUMPS" 177559ac8732SStefano Zampini PetscErrorCode MatMumpsCreateSchurComplement_MUMPS(Mat F,Mat* S) 17766444a565SStefano Zampini { 17776444a565SStefano Zampini Mat St; 17786444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17796444a565SStefano Zampini PetscScalar *array; 17806444a565SStefano Zampini #if defined(PETSC_USE_COMPLEX) 17816444a565SStefano Zampini PetscScalar im = PetscSqrtScalar(-1.0); 17826444a565SStefano Zampini #endif 17836444a565SStefano Zampini PetscErrorCode ierr; 17846444a565SStefano Zampini 17856444a565SStefano Zampini PetscFunctionBegin; 178659ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 178759ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 178859ac8732SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 178959ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 179059ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 179159ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 179259ac8732SStefano Zampini } else if (!mumps->schur_restored) { 179359ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 17946444a565SStefano Zampini } 17956444a565SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)F),&St);CHKERRQ(ierr); 17966444a565SStefano Zampini ierr = MatSetSizes(St,PETSC_DECIDE,PETSC_DECIDE,mumps->id.size_schur,mumps->id.size_schur);CHKERRQ(ierr); 17976444a565SStefano Zampini ierr = MatSetType(St,MATDENSE);CHKERRQ(ierr); 17986444a565SStefano Zampini ierr = MatSetUp(St);CHKERRQ(ierr); 17996444a565SStefano Zampini ierr = MatDenseGetArray(St,&array);CHKERRQ(ierr); 180059ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full matrix */ 18016444a565SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 18026444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18036444a565SStefano Zampini for (i=0;i<N;i++) { 18046444a565SStefano Zampini for (j=0;j<N;j++) { 18056444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18066444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18076444a565SStefano Zampini #else 18086444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18096444a565SStefano Zampini #endif 18106444a565SStefano Zampini array[j*N+i] = val; 18116444a565SStefano Zampini } 18126444a565SStefano Zampini } 18136444a565SStefano Zampini } else { /* stored by columns */ 18146444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18156444a565SStefano Zampini } 18166444a565SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 18176444a565SStefano Zampini if (mumps->id.ICNTL(19) == 2) { /* lower triangular stored by columns */ 18186444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18196444a565SStefano Zampini for (i=0;i<N;i++) { 18206444a565SStefano Zampini for (j=i;j<N;j++) { 18216444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18226444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18236444a565SStefano Zampini #else 18246444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18256444a565SStefano Zampini #endif 18266444a565SStefano Zampini array[i*N+j] = val; 18276444a565SStefano Zampini array[j*N+i] = val; 18286444a565SStefano Zampini } 18296444a565SStefano Zampini } 18306444a565SStefano Zampini } else if (mumps->id.ICNTL(19) == 3) { /* full matrix */ 18316444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18326444a565SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 18336444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18346444a565SStefano Zampini for (i=0;i<N;i++) { 18356444a565SStefano Zampini for (j=0;j<i+1;j++) { 18366444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18376444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18386444a565SStefano Zampini #else 18396444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18406444a565SStefano Zampini #endif 18416444a565SStefano Zampini array[i*N+j] = val; 18426444a565SStefano Zampini array[j*N+i] = val; 18436444a565SStefano Zampini } 18446444a565SStefano Zampini } 18456444a565SStefano Zampini } 18466444a565SStefano Zampini } 18476444a565SStefano Zampini ierr = MatDenseRestoreArray(St,&array);CHKERRQ(ierr); 18486444a565SStefano Zampini *S = St; 18496444a565SStefano Zampini PetscFunctionReturn(0); 18506444a565SStefano Zampini } 18516444a565SStefano Zampini 18526444a565SStefano Zampini #undef __FUNCT__ 185359ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement" 18546444a565SStefano Zampini /*@ 185559ac8732SStefano Zampini MatMumpsCreateSchurComplement - Create a Schur complement matrix object using Schur data computed by MUMPS during the factorization step 18566444a565SStefano Zampini 18576444a565SStefano Zampini Logically Collective on Mat 18586444a565SStefano Zampini 18596444a565SStefano Zampini Input Parameters: 18606444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 18616444a565SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 18626444a565SStefano Zampini 18636444a565SStefano Zampini Notes: 186459ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 186559ac8732SStefano Zampini The routine provides a copy of the Schur data stored within MUMPS data strutures. The caller must destroy the object when it is no longer needed. 1866066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 18676444a565SStefano Zampini 18686444a565SStefano Zampini Level: advanced 18696444a565SStefano Zampini 18706444a565SStefano Zampini References: MUMPS Users' Guide 18716444a565SStefano Zampini 187259ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement() 187359ac8732SStefano Zampini @*/ 187459ac8732SStefano Zampini PetscErrorCode MatMumpsCreateSchurComplement(Mat F,Mat* S) 187559ac8732SStefano Zampini { 187659ac8732SStefano Zampini PetscErrorCode ierr; 187759ac8732SStefano Zampini 187859ac8732SStefano Zampini PetscFunctionBegin; 1879e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 188059ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsCreateSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 188159ac8732SStefano Zampini PetscFunctionReturn(0); 188259ac8732SStefano Zampini } 188359ac8732SStefano Zampini 188459ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 188559ac8732SStefano Zampini #undef __FUNCT__ 188659ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement_MUMPS" 188759ac8732SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement_MUMPS(Mat F,Mat* S) 188859ac8732SStefano Zampini { 188959ac8732SStefano Zampini Mat St; 189059ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 189159ac8732SStefano Zampini PetscErrorCode ierr; 189259ac8732SStefano Zampini 189359ac8732SStefano Zampini PetscFunctionBegin; 189459ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 189559ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 189659ac8732SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 189759ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 189859ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 189959ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 190059ac8732SStefano Zampini } else if (!mumps->schur_restored) { 190159ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 190259ac8732SStefano Zampini } 190359ac8732SStefano Zampini /* It should be the responsibility of the user to handle different ICNTL(19) cases if they want to work with the raw data */ 190459ac8732SStefano Zampini /* should I also add errors when the Schur complement has been already factored? */ 190559ac8732SStefano Zampini ierr = MatCreateSeqDense(PetscObjectComm((PetscObject)F),mumps->id.size_schur,mumps->id.size_schur,(PetscScalar*)mumps->id.schur,&St);CHKERRQ(ierr); 190659ac8732SStefano Zampini *S = St; 190759ac8732SStefano Zampini mumps->schur_restored = PETSC_FALSE; 190859ac8732SStefano Zampini PetscFunctionReturn(0); 190959ac8732SStefano Zampini } 191059ac8732SStefano Zampini 191159ac8732SStefano Zampini #undef __FUNCT__ 191259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement" 191359ac8732SStefano Zampini /*@ 191459ac8732SStefano Zampini MatMumpsGetSchurComplement - Get a Schur complement matrix object using the current status of the raw Schur data computed by MUMPS during the factorization step 191559ac8732SStefano Zampini 191659ac8732SStefano Zampini Logically Collective on Mat 191759ac8732SStefano Zampini 191859ac8732SStefano Zampini Input Parameters: 191959ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 192059ac8732SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 192159ac8732SStefano Zampini 192259ac8732SStefano Zampini Notes: 192359ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 192459ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. The caller should call MatMumpsRestoreSchurComplement when the object is no longer needed. 1925066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 192659ac8732SStefano Zampini 192759ac8732SStefano Zampini Level: advanced 192859ac8732SStefano Zampini 192959ac8732SStefano Zampini References: MUMPS Users' Guide 193059ac8732SStefano Zampini 193159ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsRestoreSchurComplement(), MatMumpsCreateSchurComplement() 19326444a565SStefano Zampini @*/ 19336444a565SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement(Mat F,Mat* S) 19346444a565SStefano Zampini { 19356444a565SStefano Zampini PetscErrorCode ierr; 19366444a565SStefano Zampini 19376444a565SStefano Zampini PetscFunctionBegin; 1938e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 193959ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsGetSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 194059ac8732SStefano Zampini PetscFunctionReturn(0); 194159ac8732SStefano Zampini } 194259ac8732SStefano Zampini 194359ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 194459ac8732SStefano Zampini #undef __FUNCT__ 194559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement_MUMPS" 194659ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement_MUMPS(Mat F,Mat* S) 194759ac8732SStefano Zampini { 194859ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 194959ac8732SStefano Zampini PetscErrorCode ierr; 195059ac8732SStefano Zampini 195159ac8732SStefano Zampini PetscFunctionBegin; 195259ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 195359ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 195459ac8732SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 195559ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 195659ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 195759ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 1958066565c5SStefano Zampini } else if (mumps->schur_restored) { 1959066565c5SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has been already restored"); 196059ac8732SStefano Zampini } 196159ac8732SStefano Zampini ierr = MatDestroy(S);CHKERRQ(ierr); 196259ac8732SStefano Zampini *S = NULL; 196359ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 196459ac8732SStefano Zampini PetscFunctionReturn(0); 196559ac8732SStefano Zampini } 196659ac8732SStefano Zampini 196759ac8732SStefano Zampini #undef __FUNCT__ 196859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement" 196959ac8732SStefano Zampini /*@ 197059ac8732SStefano Zampini MatMumpsRestoreSchurComplement - Restore the Schur complement matrix object obtained from a call to MatGetSchurComplement 197159ac8732SStefano Zampini 197259ac8732SStefano Zampini Logically Collective on Mat 197359ac8732SStefano Zampini 197459ac8732SStefano Zampini Input Parameters: 197559ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 197659ac8732SStefano Zampini . *S - location where the Schur complement is stored 197759ac8732SStefano Zampini 197859ac8732SStefano Zampini Notes: 197959ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 198059ac8732SStefano Zampini 198159ac8732SStefano Zampini Level: advanced 198259ac8732SStefano Zampini 198359ac8732SStefano Zampini References: MUMPS Users' Guide 198459ac8732SStefano Zampini 198559ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement(), MatMumpsCreateSchurComplement() 198659ac8732SStefano Zampini @*/ 198759ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement(Mat F,Mat* S) 198859ac8732SStefano Zampini { 198959ac8732SStefano Zampini PetscErrorCode ierr; 199059ac8732SStefano Zampini 199159ac8732SStefano Zampini PetscFunctionBegin; 1992e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 199359ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsRestoreSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 199459ac8732SStefano Zampini PetscFunctionReturn(0); 199559ac8732SStefano Zampini } 199659ac8732SStefano Zampini 199759ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 199859ac8732SStefano Zampini #undef __FUNCT__ 199959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement_MUMPS" 200059ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement_MUMPS(Mat F) 200159ac8732SStefano Zampini { 200259ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 200359ac8732SStefano Zampini PetscErrorCode ierr; 200459ac8732SStefano Zampini 200559ac8732SStefano Zampini PetscFunctionBegin; 200659ac8732SStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing */ 200759ac8732SStefano Zampini PetscFunctionReturn(0); 200859ac8732SStefano Zampini } 200959ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 201059ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 201159ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 201259ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 201359ac8732SStefano Zampini } else if (!mumps->schur_restored) { 201459ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 201559ac8732SStefano Zampini } 201659ac8732SStefano Zampini ierr = MatMumpsInvertSchur_Private(mumps);CHKERRQ(ierr); 201759ac8732SStefano Zampini PetscFunctionReturn(0); 201859ac8732SStefano Zampini } 201959ac8732SStefano Zampini 202059ac8732SStefano Zampini #undef __FUNCT__ 202159ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement" 202259ac8732SStefano Zampini /*@ 202359ac8732SStefano Zampini MatMumpsInvertSchurComplement - Invert the raw Schur data computed by MUMPS during the factorization step 202459ac8732SStefano Zampini 202559ac8732SStefano Zampini Logically Collective on Mat 202659ac8732SStefano Zampini 202759ac8732SStefano Zampini Input Parameters: 202859ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 202959ac8732SStefano Zampini 203059ac8732SStefano Zampini Notes: 203159ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 203259ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. 203359ac8732SStefano Zampini 203459ac8732SStefano Zampini Level: advanced 203559ac8732SStefano Zampini 203659ac8732SStefano Zampini References: MUMPS Users' Guide 203759ac8732SStefano Zampini 203859ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 203959ac8732SStefano Zampini @*/ 204059ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement(Mat F) 204159ac8732SStefano Zampini { 204259ac8732SStefano Zampini PetscErrorCode ierr; 204359ac8732SStefano Zampini 204459ac8732SStefano Zampini PetscFunctionBegin; 2045e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 204659ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsInvertSchurComplement_C",(Mat),(F));CHKERRQ(ierr); 20476444a565SStefano Zampini PetscFunctionReturn(0); 20486444a565SStefano Zampini } 20496444a565SStefano Zampini 20506444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 20516444a565SStefano Zampini #undef __FUNCT__ 2052e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement_MUMPS" 2053e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement_MUMPS(Mat F, Vec rhs, Vec sol) 2054e807eca7SStefano Zampini { 2055e807eca7SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2056e807eca7SStefano Zampini MumpsScalar *orhs; 2057e807eca7SStefano Zampini PetscScalar *osol,*nrhs,*nsol; 2058e807eca7SStefano Zampini PetscErrorCode ierr; 2059e807eca7SStefano Zampini 2060e807eca7SStefano Zampini PetscFunctionBegin; 2061e807eca7SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 2062e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 2063e807eca7SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 2064e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 2065e807eca7SStefano Zampini } else if (!mumps->id.size_schur) { 2066e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 2067e807eca7SStefano Zampini } else if (!mumps->schur_restored) { 2068e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 2069e807eca7SStefano Zampini } 2070e807eca7SStefano Zampini /* swap pointers */ 2071e807eca7SStefano Zampini orhs = mumps->id.redrhs; 2072e807eca7SStefano Zampini osol = mumps->schur_sol; 2073e807eca7SStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 2074e807eca7SStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 2075e807eca7SStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2076e807eca7SStefano Zampini mumps->schur_sol = nsol; 2077e807eca7SStefano Zampini /* solve Schur complement */ 2078e807eca7SStefano Zampini mumps->id.nrhs = 1; 2079e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 2080e807eca7SStefano Zampini /* restore pointers */ 2081e807eca7SStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 2082e807eca7SStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 2083e807eca7SStefano Zampini mumps->id.redrhs = orhs; 2084e807eca7SStefano Zampini mumps->schur_sol = osol; 2085e807eca7SStefano Zampini PetscFunctionReturn(0); 2086e807eca7SStefano Zampini } 2087e807eca7SStefano Zampini 2088e807eca7SStefano Zampini #undef __FUNCT__ 2089e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement" 2090e807eca7SStefano Zampini /*@ 2091e807eca7SStefano Zampini MatMumpsSolveSchurComplement - Solve the Schur complement system computed by MUMPS during the factorization step 2092e807eca7SStefano Zampini 2093e807eca7SStefano Zampini Logically Collective on Mat 2094e807eca7SStefano Zampini 2095e807eca7SStefano Zampini Input Parameters: 2096e807eca7SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2097e807eca7SStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 2098e807eca7SStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 2099e807eca7SStefano Zampini 2100e807eca7SStefano Zampini Notes: 2101e807eca7SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 2102e807eca7SStefano Zampini The sizes of the vectors should match the size of the Schur complement 2103e807eca7SStefano Zampini 2104e807eca7SStefano Zampini Level: advanced 2105e807eca7SStefano Zampini 2106e807eca7SStefano Zampini References: MUMPS Users' Guide 2107e807eca7SStefano Zampini 2108e807eca7SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 2109e807eca7SStefano Zampini @*/ 2110e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement(Mat F, Vec rhs, Vec sol) 2111e807eca7SStefano Zampini { 2112e807eca7SStefano Zampini PetscErrorCode ierr; 2113e807eca7SStefano Zampini 2114e807eca7SStefano Zampini PetscFunctionBegin; 2115e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 2116e807eca7SStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 2117e807eca7SStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 2118e807eca7SStefano Zampini PetscCheckSameComm(F,1,rhs,2); 2119e807eca7SStefano Zampini PetscCheckSameComm(F,1,sol,3); 2120*7404bcfbSStefano Zampini ierr = PetscUseMethod(F,"MatMumpsSolveSchurComplement_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 2121*7404bcfbSStefano Zampini PetscFunctionReturn(0); 2122*7404bcfbSStefano Zampini } 2123*7404bcfbSStefano Zampini 2124*7404bcfbSStefano Zampini /* -------------------------------------------------------------------------------------------*/ 2125*7404bcfbSStefano Zampini #undef __FUNCT__ 2126*7404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose_MUMPS" 2127*7404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose_MUMPS(Mat F, Vec rhs, Vec sol) 2128*7404bcfbSStefano Zampini { 2129*7404bcfbSStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2130*7404bcfbSStefano Zampini MumpsScalar *orhs; 2131*7404bcfbSStefano Zampini PetscScalar *osol,*nrhs,*nsol; 2132*7404bcfbSStefano Zampini PetscErrorCode ierr; 2133*7404bcfbSStefano Zampini 2134*7404bcfbSStefano Zampini PetscFunctionBegin; 2135*7404bcfbSStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 2136*7404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 2137*7404bcfbSStefano Zampini } else if (!mumps->id.ICNTL(19)) { 2138*7404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 2139*7404bcfbSStefano Zampini } else if (!mumps->id.size_schur) { 2140*7404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 2141*7404bcfbSStefano Zampini } else if (!mumps->schur_restored) { 2142*7404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 2143*7404bcfbSStefano Zampini } 2144*7404bcfbSStefano Zampini /* swap pointers */ 2145*7404bcfbSStefano Zampini orhs = mumps->id.redrhs; 2146*7404bcfbSStefano Zampini osol = mumps->schur_sol; 2147*7404bcfbSStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 2148*7404bcfbSStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 2149*7404bcfbSStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2150*7404bcfbSStefano Zampini mumps->schur_sol = nsol; 2151*7404bcfbSStefano Zampini /* solve Schur complement */ 2152*7404bcfbSStefano Zampini mumps->id.nrhs = 1; 2153*7404bcfbSStefano Zampini mumps->id.ICNTL(9) = 0; 2154*7404bcfbSStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 2155*7404bcfbSStefano Zampini mumps->id.ICNTL(9) = 1; 2156*7404bcfbSStefano Zampini /* restore pointers */ 2157*7404bcfbSStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 2158*7404bcfbSStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 2159*7404bcfbSStefano Zampini mumps->id.redrhs = orhs; 2160*7404bcfbSStefano Zampini mumps->schur_sol = osol; 2161*7404bcfbSStefano Zampini PetscFunctionReturn(0); 2162*7404bcfbSStefano Zampini } 2163*7404bcfbSStefano Zampini 2164*7404bcfbSStefano Zampini #undef __FUNCT__ 2165*7404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose" 2166*7404bcfbSStefano Zampini /*@ 2167*7404bcfbSStefano Zampini MatMumpsSolveSchurComplementTranspose - Solve the transpose of the Schur complement system computed by MUMPS during the factorization step 2168*7404bcfbSStefano Zampini 2169*7404bcfbSStefano Zampini Logically Collective on Mat 2170*7404bcfbSStefano Zampini 2171*7404bcfbSStefano Zampini Input Parameters: 2172*7404bcfbSStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2173*7404bcfbSStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 2174*7404bcfbSStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 2175*7404bcfbSStefano Zampini 2176*7404bcfbSStefano Zampini Notes: 2177*7404bcfbSStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 2178*7404bcfbSStefano Zampini The sizes of the vectors should match the size of the Schur complement 2179*7404bcfbSStefano Zampini 2180*7404bcfbSStefano Zampini Level: advanced 2181*7404bcfbSStefano Zampini 2182*7404bcfbSStefano Zampini References: MUMPS Users' Guide 2183*7404bcfbSStefano Zampini 2184*7404bcfbSStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 2185*7404bcfbSStefano Zampini @*/ 2186*7404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose(Mat F, Vec rhs, Vec sol) 2187*7404bcfbSStefano Zampini { 2188*7404bcfbSStefano Zampini PetscErrorCode ierr; 2189*7404bcfbSStefano Zampini 2190*7404bcfbSStefano Zampini PetscFunctionBegin; 2191*7404bcfbSStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 2192*7404bcfbSStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 2193*7404bcfbSStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 2194*7404bcfbSStefano Zampini PetscCheckSameComm(F,1,rhs,2); 2195*7404bcfbSStefano Zampini PetscCheckSameComm(F,1,sol,3); 2196*7404bcfbSStefano Zampini ierr = PetscUseMethod(F,"MatMumpsSolveSchurComplementTranspose_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 2197e807eca7SStefano Zampini PetscFunctionReturn(0); 2198e807eca7SStefano Zampini } 2199e807eca7SStefano Zampini 2200e807eca7SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 2201e807eca7SStefano Zampini #undef __FUNCT__ 22025ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 22035ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 22045ccb76cbSHong Zhang { 2205a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 22065ccb76cbSHong Zhang 22075ccb76cbSHong Zhang PetscFunctionBegin; 2208a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 22095ccb76cbSHong Zhang PetscFunctionReturn(0); 22105ccb76cbSHong Zhang } 22115ccb76cbSHong Zhang 22125ccb76cbSHong Zhang #undef __FUNCT__ 2213bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 2214bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 2215bc6112feSHong Zhang { 2216bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2217bc6112feSHong Zhang 2218bc6112feSHong Zhang PetscFunctionBegin; 2219bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 2220bc6112feSHong Zhang PetscFunctionReturn(0); 2221bc6112feSHong Zhang } 2222bc6112feSHong Zhang 2223bc6112feSHong Zhang #undef __FUNCT__ 22245ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 22255ccb76cbSHong Zhang /*@ 22265ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 22275ccb76cbSHong Zhang 22285ccb76cbSHong Zhang Logically Collective on Mat 22295ccb76cbSHong Zhang 22305ccb76cbSHong Zhang Input Parameters: 22315ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 22325ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 22335ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 22345ccb76cbSHong Zhang 22355ccb76cbSHong Zhang Options Database: 22365ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 22375ccb76cbSHong Zhang 22385ccb76cbSHong Zhang Level: beginner 22395ccb76cbSHong Zhang 22405ccb76cbSHong Zhang References: MUMPS Users' Guide 22415ccb76cbSHong Zhang 22425ccb76cbSHong Zhang .seealso: MatGetFactor() 22435ccb76cbSHong Zhang @*/ 22445ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 22455ccb76cbSHong Zhang { 22465ccb76cbSHong Zhang PetscErrorCode ierr; 22475ccb76cbSHong Zhang 22485ccb76cbSHong Zhang PetscFunctionBegin; 22495ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 22505ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 22515ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 22525ccb76cbSHong Zhang PetscFunctionReturn(0); 22535ccb76cbSHong Zhang } 22545ccb76cbSHong Zhang 2255bc6112feSHong Zhang #undef __FUNCT__ 2256bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 2257a21f80fcSHong Zhang /*@ 2258a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS parameter ICNTL() 2259a21f80fcSHong Zhang 2260a21f80fcSHong Zhang Logically Collective on Mat 2261a21f80fcSHong Zhang 2262a21f80fcSHong Zhang Input Parameters: 2263a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2264a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 2265a21f80fcSHong Zhang 2266a21f80fcSHong Zhang Output Parameter: 2267a21f80fcSHong Zhang . ival - value of MUMPS ICNTL(icntl) 2268a21f80fcSHong Zhang 2269a21f80fcSHong Zhang Level: beginner 2270a21f80fcSHong Zhang 2271a21f80fcSHong Zhang References: MUMPS Users' Guide 2272a21f80fcSHong Zhang 2273a21f80fcSHong Zhang .seealso: MatGetFactor() 2274a21f80fcSHong Zhang @*/ 2275bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 2276bc6112feSHong Zhang { 2277bc6112feSHong Zhang PetscErrorCode ierr; 2278bc6112feSHong Zhang 2279bc6112feSHong Zhang PetscFunctionBegin; 2280bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2281bc6112feSHong Zhang PetscValidIntPointer(ival,3); 2282bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2283bc6112feSHong Zhang PetscFunctionReturn(0); 2284bc6112feSHong Zhang } 2285bc6112feSHong Zhang 22868928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 22878928b65cSHong Zhang #undef __FUNCT__ 22888928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 22898928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 22908928b65cSHong Zhang { 22918928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 22928928b65cSHong Zhang 22938928b65cSHong Zhang PetscFunctionBegin; 22948928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 22958928b65cSHong Zhang PetscFunctionReturn(0); 22968928b65cSHong Zhang } 22978928b65cSHong Zhang 22988928b65cSHong Zhang #undef __FUNCT__ 2299bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl_MUMPS" 2300bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 2301bc6112feSHong Zhang { 2302bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2303bc6112feSHong Zhang 2304bc6112feSHong Zhang PetscFunctionBegin; 2305bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 2306bc6112feSHong Zhang PetscFunctionReturn(0); 2307bc6112feSHong Zhang } 2308bc6112feSHong Zhang 2309bc6112feSHong Zhang #undef __FUNCT__ 23108928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 23118928b65cSHong Zhang /*@ 23128928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 23138928b65cSHong Zhang 23148928b65cSHong Zhang Logically Collective on Mat 23158928b65cSHong Zhang 23168928b65cSHong Zhang Input Parameters: 23178928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 23188928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 23198928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 23208928b65cSHong Zhang 23218928b65cSHong Zhang Options Database: 23228928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 23238928b65cSHong Zhang 23248928b65cSHong Zhang Level: beginner 23258928b65cSHong Zhang 23268928b65cSHong Zhang References: MUMPS Users' Guide 23278928b65cSHong Zhang 23288928b65cSHong Zhang .seealso: MatGetFactor() 23298928b65cSHong Zhang @*/ 23308928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 23318928b65cSHong Zhang { 23328928b65cSHong Zhang PetscErrorCode ierr; 23338928b65cSHong Zhang 23348928b65cSHong Zhang PetscFunctionBegin; 23358928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2336bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 23378928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 23388928b65cSHong Zhang PetscFunctionReturn(0); 23398928b65cSHong Zhang } 23408928b65cSHong Zhang 2341bc6112feSHong Zhang #undef __FUNCT__ 2342bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 2343a21f80fcSHong Zhang /*@ 2344a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 2345a21f80fcSHong Zhang 2346a21f80fcSHong Zhang Logically Collective on Mat 2347a21f80fcSHong Zhang 2348a21f80fcSHong Zhang Input Parameters: 2349a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2350a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 2351a21f80fcSHong Zhang 2352a21f80fcSHong Zhang Output Parameter: 2353a21f80fcSHong Zhang . val - value of MUMPS CNTL(icntl) 2354a21f80fcSHong Zhang 2355a21f80fcSHong Zhang Level: beginner 2356a21f80fcSHong Zhang 2357a21f80fcSHong Zhang References: MUMPS Users' Guide 2358a21f80fcSHong Zhang 2359a21f80fcSHong Zhang .seealso: MatGetFactor() 2360a21f80fcSHong Zhang @*/ 2361bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 2362bc6112feSHong Zhang { 2363bc6112feSHong Zhang PetscErrorCode ierr; 2364bc6112feSHong Zhang 2365bc6112feSHong Zhang PetscFunctionBegin; 2366bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2367bc6112feSHong Zhang PetscValidRealPointer(val,3); 2368bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2369bc6112feSHong Zhang PetscFunctionReturn(0); 2370bc6112feSHong Zhang } 2371bc6112feSHong Zhang 2372bc6112feSHong Zhang #undef __FUNCT__ 2373ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 2374ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 2375bc6112feSHong Zhang { 2376bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2377bc6112feSHong Zhang 2378bc6112feSHong Zhang PetscFunctionBegin; 2379bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 2380bc6112feSHong Zhang PetscFunctionReturn(0); 2381bc6112feSHong Zhang } 2382bc6112feSHong Zhang 2383bc6112feSHong Zhang #undef __FUNCT__ 2384ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 2385ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 2386bc6112feSHong Zhang { 2387bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2388bc6112feSHong Zhang 2389bc6112feSHong Zhang PetscFunctionBegin; 2390bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 2391bc6112feSHong Zhang PetscFunctionReturn(0); 2392bc6112feSHong Zhang } 2393bc6112feSHong Zhang 2394bc6112feSHong Zhang #undef __FUNCT__ 2395ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo_MUMPS" 2396ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 2397bc6112feSHong Zhang { 2398bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2399bc6112feSHong Zhang 2400bc6112feSHong Zhang PetscFunctionBegin; 2401bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 2402bc6112feSHong Zhang PetscFunctionReturn(0); 2403bc6112feSHong Zhang } 2404bc6112feSHong Zhang 2405bc6112feSHong Zhang #undef __FUNCT__ 2406ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 2407ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 2408bc6112feSHong Zhang { 2409bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2410bc6112feSHong Zhang 2411bc6112feSHong Zhang PetscFunctionBegin; 2412bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 2413bc6112feSHong Zhang PetscFunctionReturn(0); 2414bc6112feSHong Zhang } 2415bc6112feSHong Zhang 2416bc6112feSHong Zhang #undef __FUNCT__ 2417ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 2418a21f80fcSHong Zhang /*@ 2419a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 2420a21f80fcSHong Zhang 2421a21f80fcSHong Zhang Logically Collective on Mat 2422a21f80fcSHong Zhang 2423a21f80fcSHong Zhang Input Parameters: 2424a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2425a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 2426a21f80fcSHong Zhang 2427a21f80fcSHong Zhang Output Parameter: 2428a21f80fcSHong Zhang . ival - value of MUMPS INFO(icntl) 2429a21f80fcSHong Zhang 2430a21f80fcSHong Zhang Level: beginner 2431a21f80fcSHong Zhang 2432a21f80fcSHong Zhang References: MUMPS Users' Guide 2433a21f80fcSHong Zhang 2434a21f80fcSHong Zhang .seealso: MatGetFactor() 2435a21f80fcSHong Zhang @*/ 2436ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 2437bc6112feSHong Zhang { 2438bc6112feSHong Zhang PetscErrorCode ierr; 2439bc6112feSHong Zhang 2440bc6112feSHong Zhang PetscFunctionBegin; 2441ca810319SHong Zhang PetscValidIntPointer(ival,3); 2442ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2443bc6112feSHong Zhang PetscFunctionReturn(0); 2444bc6112feSHong Zhang } 2445bc6112feSHong Zhang 2446bc6112feSHong Zhang #undef __FUNCT__ 2447ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 2448a21f80fcSHong Zhang /*@ 2449a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 2450a21f80fcSHong Zhang 2451a21f80fcSHong Zhang Logically Collective on Mat 2452a21f80fcSHong Zhang 2453a21f80fcSHong Zhang Input Parameters: 2454a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2455a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 2456a21f80fcSHong Zhang 2457a21f80fcSHong Zhang Output Parameter: 2458a21f80fcSHong Zhang . ival - value of MUMPS INFOG(icntl) 2459a21f80fcSHong Zhang 2460a21f80fcSHong Zhang Level: beginner 2461a21f80fcSHong Zhang 2462a21f80fcSHong Zhang References: MUMPS Users' Guide 2463a21f80fcSHong Zhang 2464a21f80fcSHong Zhang .seealso: MatGetFactor() 2465a21f80fcSHong Zhang @*/ 2466ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 2467bc6112feSHong Zhang { 2468bc6112feSHong Zhang PetscErrorCode ierr; 2469bc6112feSHong Zhang 2470bc6112feSHong Zhang PetscFunctionBegin; 2471ca810319SHong Zhang PetscValidIntPointer(ival,3); 2472ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2473bc6112feSHong Zhang PetscFunctionReturn(0); 2474bc6112feSHong Zhang } 2475bc6112feSHong Zhang 2476bc6112feSHong Zhang #undef __FUNCT__ 2477ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 2478a21f80fcSHong Zhang /*@ 2479a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 2480a21f80fcSHong Zhang 2481a21f80fcSHong Zhang Logically Collective on Mat 2482a21f80fcSHong Zhang 2483a21f80fcSHong Zhang Input Parameters: 2484a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2485a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 2486a21f80fcSHong Zhang 2487a21f80fcSHong Zhang Output Parameter: 2488a21f80fcSHong Zhang . val - value of MUMPS RINFO(icntl) 2489a21f80fcSHong Zhang 2490a21f80fcSHong Zhang Level: beginner 2491a21f80fcSHong Zhang 2492a21f80fcSHong Zhang References: MUMPS Users' Guide 2493a21f80fcSHong Zhang 2494a21f80fcSHong Zhang .seealso: MatGetFactor() 2495a21f80fcSHong Zhang @*/ 2496ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 2497bc6112feSHong Zhang { 2498bc6112feSHong Zhang PetscErrorCode ierr; 2499bc6112feSHong Zhang 2500bc6112feSHong Zhang PetscFunctionBegin; 2501bc6112feSHong Zhang PetscValidRealPointer(val,3); 2502ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2503bc6112feSHong Zhang PetscFunctionReturn(0); 2504bc6112feSHong Zhang } 2505bc6112feSHong Zhang 2506bc6112feSHong Zhang #undef __FUNCT__ 2507ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 2508a21f80fcSHong Zhang /*@ 2509a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 2510a21f80fcSHong Zhang 2511a21f80fcSHong Zhang Logically Collective on Mat 2512a21f80fcSHong Zhang 2513a21f80fcSHong Zhang Input Parameters: 2514a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2515a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 2516a21f80fcSHong Zhang 2517a21f80fcSHong Zhang Output Parameter: 2518a21f80fcSHong Zhang . val - value of MUMPS RINFOG(icntl) 2519a21f80fcSHong Zhang 2520a21f80fcSHong Zhang Level: beginner 2521a21f80fcSHong Zhang 2522a21f80fcSHong Zhang References: MUMPS Users' Guide 2523a21f80fcSHong Zhang 2524a21f80fcSHong Zhang .seealso: MatGetFactor() 2525a21f80fcSHong Zhang @*/ 2526ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 2527bc6112feSHong Zhang { 2528bc6112feSHong Zhang PetscErrorCode ierr; 2529bc6112feSHong Zhang 2530bc6112feSHong Zhang PetscFunctionBegin; 2531bc6112feSHong Zhang PetscValidRealPointer(val,3); 2532ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2533bc6112feSHong Zhang PetscFunctionReturn(0); 2534bc6112feSHong Zhang } 2535bc6112feSHong Zhang 253624b6179bSKris Buschelman /*MC 25372692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 253824b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 253924b6179bSKris Buschelman 254041c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 254124b6179bSKris Buschelman 254224b6179bSKris Buschelman Options Database Keys: 25434e34a73bSHong Zhang + -mat_mumps_icntl_1 <6>: ICNTL(1): output stream for error messages (None) 25444e34a73bSHong Zhang . -mat_mumps_icntl_2 <0>: ICNTL(2): output stream for diagnostic printing, statistics, and warning (None) 25454e34a73bSHong Zhang . -mat_mumps_icntl_3 <0>: ICNTL(3): output stream for global information, collected on the host (None) 25464e34a73bSHong Zhang . -mat_mumps_icntl_4 <0>: ICNTL(4): level of printing (0 to 4) (None) 25474e34a73bSHong Zhang . -mat_mumps_icntl_6 <7>: ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) (None) 25484e34a73bSHong Zhang . -mat_mumps_icntl_7 <7>: ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis (None) 25494e34a73bSHong Zhang . -mat_mumps_icntl_8 <77>: ICNTL(8): scaling strategy (-2 to 8 or 77) (None) 25504e34a73bSHong Zhang . -mat_mumps_icntl_10 <0>: ICNTL(10): max num of refinements (None) 25514e34a73bSHong Zhang . -mat_mumps_icntl_11 <0>: ICNTL(11): statistics related to an error analysis (via -ksp_view) (None) 25524e34a73bSHong Zhang . -mat_mumps_icntl_12 <1>: ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) (None) 25534e34a73bSHong Zhang . -mat_mumps_icntl_13 <0>: ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting (None) 25544e34a73bSHong Zhang . -mat_mumps_icntl_14 <20>: ICNTL(14): percentage increase in the estimated working space (None) 25554e34a73bSHong Zhang . -mat_mumps_icntl_19 <0>: ICNTL(19): computes the Schur complement (None) 25564e34a73bSHong Zhang . -mat_mumps_icntl_22 <0>: ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) (None) 25574e34a73bSHong Zhang . -mat_mumps_icntl_23 <0>: ICNTL(23): max size of the working memory (MB) that can allocate per processor (None) 25584e34a73bSHong Zhang . -mat_mumps_icntl_24 <0>: ICNTL(24): detection of null pivot rows (0 or 1) (None) 25594e34a73bSHong Zhang . -mat_mumps_icntl_25 <0>: ICNTL(25): compute a solution of a deficient matrix and a null space basis (None) 25604e34a73bSHong Zhang . -mat_mumps_icntl_26 <0>: ICNTL(26): drives the solution phase if a Schur complement matrix (None) 25614e34a73bSHong Zhang . -mat_mumps_icntl_28 <1>: ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering (None) 25624e34a73bSHong Zhang . -mat_mumps_icntl_29 <0>: ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis (None) 25634e34a73bSHong Zhang . -mat_mumps_icntl_30 <0>: ICNTL(30): compute user-specified set of entries in inv(A) (None) 25644e34a73bSHong Zhang . -mat_mumps_icntl_31 <0>: ICNTL(31): indicates which factors may be discarded during factorization (None) 25654e34a73bSHong Zhang . -mat_mumps_icntl_33 <0>: ICNTL(33): compute determinant (None) 25664e34a73bSHong Zhang . -mat_mumps_cntl_1 <0.01>: CNTL(1): relative pivoting threshold (None) 25674e34a73bSHong Zhang . -mat_mumps_cntl_2 <1.49012e-08>: CNTL(2): stopping criterion of refinement (None) 25684e34a73bSHong Zhang . -mat_mumps_cntl_3 <0>: CNTL(3): absolute pivoting threshold (None) 25694e34a73bSHong Zhang . -mat_mumps_cntl_4 <-1>: CNTL(4): value for static pivoting (None) 25704e34a73bSHong Zhang - -mat_mumps_cntl_5 <0>: CNTL(5): fixation for null pivots (None) 257124b6179bSKris Buschelman 257224b6179bSKris Buschelman Level: beginner 257324b6179bSKris Buschelman 257441c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 257541c8de11SBarry Smith 257624b6179bSKris Buschelman M*/ 257724b6179bSKris Buschelman 257835bd34faSBarry Smith #undef __FUNCT__ 257935bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 2580f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 258135bd34faSBarry Smith { 258235bd34faSBarry Smith PetscFunctionBegin; 25832692d6eeSBarry Smith *type = MATSOLVERMUMPS; 258435bd34faSBarry Smith PetscFunctionReturn(0); 258535bd34faSBarry Smith } 258635bd34faSBarry Smith 2587bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 25882877fffaSHong Zhang #undef __FUNCT__ 2589bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 25908cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 25912877fffaSHong Zhang { 25922877fffaSHong Zhang Mat B; 25932877fffaSHong Zhang PetscErrorCode ierr; 25942877fffaSHong Zhang Mat_MUMPS *mumps; 2595ace3abfcSBarry Smith PetscBool isSeqAIJ; 25962877fffaSHong Zhang 25972877fffaSHong Zhang PetscFunctionBegin; 25982877fffaSHong Zhang /* Create the factorization matrix */ 2599251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 2600ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 26012877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 26022877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2603bccb9932SShri Abhyankar if (isSeqAIJ) { 26040298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 2605bccb9932SShri Abhyankar } else { 26060298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 2607bccb9932SShri Abhyankar } 26082877fffaSHong Zhang 2609b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 26102205254eSKarl Rupp 26112877fffaSHong Zhang B->ops->view = MatView_MUMPS; 261235bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 261320be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 26142205254eSKarl Rupp 2615bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2616bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2617bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2618bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2619bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2620bc6112feSHong Zhang 2621ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2622ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2623ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2624ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 26256444a565SStefano Zampini 26266444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 262759ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 262859ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 26296444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 263059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2631e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 2632*7404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2633e807eca7SStefano Zampini 2634450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2635450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 2636d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 2637bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 2638bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 2639746480a1SHong Zhang mumps->sym = 0; 2640dcd589f8SShri Abhyankar } else { 264167877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2642450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 2643bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 2644bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 264559ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 264659ac8732SStefano Zampini mumps->sym = 2; 264759ac8732SStefano Zampini #else 26486fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 26496fdc2a6dSBarry Smith else mumps->sym = 2; 265059ac8732SStefano Zampini #endif 2651450b117fSShri Abhyankar } 26522877fffaSHong Zhang 26532877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 2654bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 26552877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 26562877fffaSHong Zhang B->spptr = (void*)mumps; 26572205254eSKarl Rupp 2658f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2659746480a1SHong Zhang 26602877fffaSHong Zhang *F = B; 26612877fffaSHong Zhang PetscFunctionReturn(0); 26622877fffaSHong Zhang } 26632877fffaSHong Zhang 2664bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 26652877fffaSHong Zhang #undef __FUNCT__ 2666bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 26678cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 26682877fffaSHong Zhang { 26692877fffaSHong Zhang Mat B; 26702877fffaSHong Zhang PetscErrorCode ierr; 26712877fffaSHong Zhang Mat_MUMPS *mumps; 2672ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 26732877fffaSHong Zhang 26742877fffaSHong Zhang PetscFunctionBegin; 2675ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 2676ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 2677251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 26782877fffaSHong Zhang /* Create the factorization matrix */ 2679ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 26802877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 26812877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2682b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2683bccb9932SShri Abhyankar if (isSeqSBAIJ) { 26840298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 26852205254eSKarl Rupp 268616ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 2687dcd589f8SShri Abhyankar } else { 26880298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 26892205254eSKarl Rupp 2690bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 2691bccb9932SShri Abhyankar } 2692bccb9932SShri Abhyankar 269367877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2694bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 269520be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 26962205254eSKarl Rupp 2697bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2698b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2699b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2700b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2701b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2702bc6112feSHong Zhang 2703ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2704ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2705ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2706ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 27072205254eSKarl Rupp 27086444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 270959ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 271059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27116444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 271259ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2713e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 2714*7404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 27156444a565SStefano Zampini 2716f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 271759ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 271859ac8732SStefano Zampini mumps->sym = 2; 271959ac8732SStefano Zampini #else 27206fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 27216fdc2a6dSBarry Smith else mumps->sym = 2; 272259ac8732SStefano Zampini #endif 2723a214ac2aSShri Abhyankar 2724bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 2725bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2726f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 27272877fffaSHong Zhang B->spptr = (void*)mumps; 27282205254eSKarl Rupp 2729f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2730746480a1SHong Zhang 27312877fffaSHong Zhang *F = B; 27322877fffaSHong Zhang PetscFunctionReturn(0); 27332877fffaSHong Zhang } 273497969023SHong Zhang 2735450b117fSShri Abhyankar #undef __FUNCT__ 2736bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 27378cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 273867877ebaSShri Abhyankar { 273967877ebaSShri Abhyankar Mat B; 274067877ebaSShri Abhyankar PetscErrorCode ierr; 274167877ebaSShri Abhyankar Mat_MUMPS *mumps; 2742ace3abfcSBarry Smith PetscBool isSeqBAIJ; 274367877ebaSShri Abhyankar 274467877ebaSShri Abhyankar PetscFunctionBegin; 274567877ebaSShri Abhyankar /* Create the factorization matrix */ 2746251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 2747ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 274867877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 274967877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2750bccb9932SShri Abhyankar if (isSeqBAIJ) { 27510298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 2752bccb9932SShri Abhyankar } else { 27530298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 2754bccb9932SShri Abhyankar } 2755450b117fSShri Abhyankar 2756b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2757450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2758450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 2759450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 2760bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 2761bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 2762746480a1SHong Zhang mumps->sym = 0; 2763f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 2764bccb9932SShri Abhyankar 2765450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 276620be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 27672205254eSKarl Rupp 2768bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2769bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2770bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2771bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2772bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2773bc6112feSHong Zhang 2774ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2775ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2776ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2777ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2778450b117fSShri Abhyankar 27796444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 278059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 278159ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27826444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 278359ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2784e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 2785*7404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 27866444a565SStefano Zampini 2787450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2788bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2789450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2790450b117fSShri Abhyankar B->spptr = (void*)mumps; 27912205254eSKarl Rupp 2792f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2793746480a1SHong Zhang 2794450b117fSShri Abhyankar *F = B; 2795450b117fSShri Abhyankar PetscFunctionReturn(0); 2796450b117fSShri Abhyankar } 279742c9c57cSBarry Smith 279842c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 279942c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat,MatFactorType,Mat*); 280042c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat,MatFactorType,Mat*); 280142c9c57cSBarry Smith 280242c9c57cSBarry Smith #undef __FUNCT__ 280342c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 280429b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 280542c9c57cSBarry Smith { 280642c9c57cSBarry Smith PetscErrorCode ierr; 280742c9c57cSBarry Smith 280842c9c57cSBarry Smith PetscFunctionBegin; 280942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 281042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 281142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 281242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 281342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 281442c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 281542c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 281642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 281742c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 281842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 281942c9c57cSBarry Smith PetscFunctionReturn(0); 282042c9c57cSBarry Smith } 282142c9c57cSBarry Smith 2822