11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8b5fa320bSStefano Zampini #include <petscblaslapack.h> 9397b6df1SKris Buschelman 10397b6df1SKris Buschelman EXTERN_C_BEGIN 11397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 122907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 132907cef9SHong Zhang #include <cmumps_c.h> 142907cef9SHong Zhang #else 15c6db04a5SJed Brown #include <zmumps_c.h> 162907cef9SHong Zhang #endif 172907cef9SHong Zhang #else 182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 192907cef9SHong Zhang #include <smumps_c.h> 20397b6df1SKris Buschelman #else 21c6db04a5SJed Brown #include <dmumps_c.h> 22397b6df1SKris Buschelman #endif 232907cef9SHong Zhang #endif 24397b6df1SKris Buschelman EXTERN_C_END 25397b6df1SKris Buschelman #define JOB_INIT -1 263d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 273d472b54SHong Zhang #define JOB_FACTNUMERIC 2 283d472b54SHong Zhang #define JOB_SOLVE 3 29397b6df1SKris Buschelman #define JOB_END -2 303d472b54SHong Zhang 312907cef9SHong Zhang /* calls to MUMPS */ 322907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 332907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 342907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 352907cef9SHong Zhang #else 362907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 372907cef9SHong Zhang #endif 382907cef9SHong Zhang #else 392907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 402907cef9SHong Zhang #define PetscMUMPS_c smumps_c 412907cef9SHong Zhang #else 422907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 432907cef9SHong Zhang #endif 442907cef9SHong Zhang #endif 452907cef9SHong Zhang 46940cd9d6SSatish Balay /* declare MumpsScalar */ 47940cd9d6SSatish Balay #if defined(PETSC_USE_COMPLEX) 
48940cd9d6SSatish Balay #if defined(PETSC_USE_REAL_SINGLE) 49940cd9d6SSatish Balay #define MumpsScalar mumps_complex 50940cd9d6SSatish Balay #else 51940cd9d6SSatish Balay #define MumpsScalar mumps_double_complex 52940cd9d6SSatish Balay #endif 53940cd9d6SSatish Balay #else 54940cd9d6SSatish Balay #define MumpsScalar PetscScalar 55940cd9d6SSatish Balay #endif 563d472b54SHong Zhang 57397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 58397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 59397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 60397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 61a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 62397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 63adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 64397b6df1SKris Buschelman 65397b6df1SKris Buschelman typedef struct { 66397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 672907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 682907cef9SHong Zhang CMUMPS_STRUC_C id; 692907cef9SHong Zhang #else 70397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 712907cef9SHong Zhang #endif 722907cef9SHong Zhang #else 732907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 742907cef9SHong Zhang SMUMPS_STRUC_C id; 75397b6df1SKris Buschelman #else 76397b6df1SKris Buschelman DMUMPS_STRUC_C id; 77397b6df1SKris Buschelman #endif 782907cef9SHong Zhang #endif 792907cef9SHong Zhang 80397b6df1SKris Buschelman MatStructure matstruc; 81c1490034SHong Zhang PetscMPIInt myid,size; 82a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 83397b6df1SKris Buschelman PetscScalar *val; 84397b6df1SKris Buschelman MPI_Comm comm_mumps; 8564e6c443SBarry Smith PetscBool isAIJ,CleanUpMUMPS; 86a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 87801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 88801fbe65SHong Zhang Vec b_seq,x_seq; 89b34f08ffSHong Zhang PetscInt ninfo,*info; /* display INFO */ 
90b5fa320bSStefano Zampini PetscBool schur_second_solve; 91b5fa320bSStefano Zampini PetscInt sizeredrhs; 92b5fa320bSStefano Zampini PetscInt *schur_pivots; 9359ac8732SStefano Zampini PetscInt schur_B_lwork; 94b5fa320bSStefano Zampini PetscScalar *schur_work; 9559ac8732SStefano Zampini PetscScalar *schur_sol; 9659ac8732SStefano Zampini PetscInt schur_sizesol; 9759ac8732SStefano Zampini PetscBool schur_restored; 9859ac8732SStefano Zampini PetscBool schur_factored; 9959ac8732SStefano Zampini PetscBool schur_inverted; 100*a0b0af32SStefano Zampini PetscInt schur_sym; 1012205254eSKarl Rupp 102bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 103bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 104f0c56d0fSKris Buschelman } Mat_MUMPS; 105f0c56d0fSKris Buschelman 10609573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 107b24902e0SBarry Smith 10859ac8732SStefano Zampini #undef __FUNCT__ 10959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsResetSchur_Private" 11059ac8732SStefano Zampini static PetscErrorCode MatMumpsResetSchur_Private(Mat_MUMPS* mumps) 111b5fa320bSStefano Zampini { 112b5fa320bSStefano Zampini PetscErrorCode ierr; 113b5fa320bSStefano Zampini 114b5fa320bSStefano Zampini PetscFunctionBegin; 11559ac8732SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 11659ac8732SStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 11759ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 11859ac8732SStefano Zampini ierr = PetscFree(mumps->schur_pivots);CHKERRQ(ierr); 11959ac8732SStefano Zampini ierr = PetscFree(mumps->schur_work);CHKERRQ(ierr); 12059ac8732SStefano Zampini if (!mumps->schur_restored) { 12159ac8732SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 12259ac8732SStefano Zampini } 12359ac8732SStefano 
Zampini mumps->id.size_schur = 0; 12459ac8732SStefano Zampini mumps->id.ICNTL(19) = 0; 12559ac8732SStefano Zampini PetscFunctionReturn(0); 12659ac8732SStefano Zampini } 12759ac8732SStefano Zampini 12859ac8732SStefano Zampini #undef __FUNCT__ 12959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsFactorSchur_Private" 13059ac8732SStefano Zampini static PetscErrorCode MatMumpsFactorSchur_Private(Mat_MUMPS* mumps) 13159ac8732SStefano Zampini { 13259ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 13359ac8732SStefano Zampini PetscErrorCode ierr; 13459ac8732SStefano Zampini 13559ac8732SStefano Zampini PetscFunctionBegin; 13659ac8732SStefano Zampini if (mumps->schur_factored) { 13759ac8732SStefano Zampini PetscFunctionReturn(0); 13859ac8732SStefano Zampini } 13959ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 14059ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 14159ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 14259ac8732SStefano Zampini if (!mumps->schur_pivots) { 14359ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 14459ac8732SStefano Zampini } 14559ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 14659ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&B_N,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&B_ierr)); 14759ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 14859ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRF Lapack routine %d",(int)B_ierr); 14959ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 15059ac8732SStefano Zampini char ord[2]; 15159ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 15259ac8732SStefano Zampini sprintf(ord,"L"); 15359ac8732SStefano 
Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 15459ac8732SStefano Zampini sprintf(ord,"U"); 15559ac8732SStefano Zampini } 156*a0b0af32SStefano Zampini if (mumps->schur_sym == 2) { 15759ac8732SStefano Zampini if (!mumps->schur_pivots) { 15859ac8732SStefano Zampini PetscScalar lwork; 15959ac8732SStefano Zampini 16059ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 16159ac8732SStefano Zampini mumps->schur_B_lwork=-1; 16259ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16359ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 16459ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 16559ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYTRF Lapack routine %d",(int)B_ierr); 16659ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 16759ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 16859ac8732SStefano Zampini } 16959ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 17059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 17159ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17259ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRF Lapack routine %d",(int)B_ierr); 17359ac8732SStefano Zampini } else { 17459ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 17559ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,&B_ierr)); 17659ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 
17759ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRF Lapack routine %d",(int)B_ierr); 17859ac8732SStefano Zampini } 17959ac8732SStefano Zampini } 18059ac8732SStefano Zampini mumps->schur_factored = PETSC_TRUE; 18159ac8732SStefano Zampini PetscFunctionReturn(0); 18259ac8732SStefano Zampini } 18359ac8732SStefano Zampini 18459ac8732SStefano Zampini #undef __FUNCT__ 18559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchur_Private" 18659ac8732SStefano Zampini static PetscErrorCode MatMumpsInvertSchur_Private(Mat_MUMPS* mumps) 18759ac8732SStefano Zampini { 18859ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 18959ac8732SStefano Zampini PetscErrorCode ierr; 19059ac8732SStefano Zampini 19159ac8732SStefano Zampini PetscFunctionBegin; 19259ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 19359ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 19459ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 19559ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 19659ac8732SStefano Zampini if (!mumps->schur_work) { 19759ac8732SStefano Zampini PetscScalar lwork; 19859ac8732SStefano Zampini 19959ac8732SStefano Zampini mumps->schur_B_lwork = -1; 20059ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20159ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 20259ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20359ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GETRI Lapack routine %d",(int)B_ierr); 20459ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 20559ac8732SStefano Zampini ierr = 
PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 20659ac8732SStefano Zampini } 20759ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20859ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 20959ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 21059ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRI Lapack routine %d",(int)B_ierr); 21159ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 21259ac8732SStefano Zampini char ord[2]; 21359ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 21459ac8732SStefano Zampini sprintf(ord,"L"); 21559ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 21659ac8732SStefano Zampini sprintf(ord,"U"); 21759ac8732SStefano Zampini } 218*a0b0af32SStefano Zampini if (mumps->schur_sym == 2) { 21959ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&B_ierr)); 22159ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22259ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRI Lapack routine %d",(int)B_ierr); 22359ac8732SStefano Zampini } else { 22459ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22559ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,&B_ierr)); 22659ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22759ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRI Lapack routine %d",(int)B_ierr); 
22859ac8732SStefano Zampini } 22959ac8732SStefano Zampini } 23059ac8732SStefano Zampini mumps->schur_inverted = PETSC_TRUE; 23159ac8732SStefano Zampini PetscFunctionReturn(0); 23259ac8732SStefano Zampini } 23359ac8732SStefano Zampini 23459ac8732SStefano Zampini #undef __FUNCT__ 23559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchur_Private" 236e807eca7SStefano Zampini static PetscErrorCode MatMumpsSolveSchur_Private(Mat_MUMPS* mumps, PetscBool sol_in_redrhs) 23759ac8732SStefano Zampini { 23859ac8732SStefano Zampini PetscBLASInt B_N,B_Nrhs,B_ierr,B_slda,B_rlda; 23959ac8732SStefano Zampini PetscScalar one=1.,zero=0.; 24059ac8732SStefano Zampini PetscErrorCode ierr; 24159ac8732SStefano Zampini 24259ac8732SStefano Zampini PetscFunctionBegin; 24359ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 244b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 245b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 246b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.nrhs,&B_Nrhs);CHKERRQ(ierr); 247b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.lredrhs,&B_rlda);CHKERRQ(ierr); 24859ac8732SStefano Zampini if (mumps->schur_inverted) { 24959ac8732SStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 25059ac8732SStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 25159ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 25259ac8732SStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 25359ac8732SStefano Zampini mumps->schur_sizesol = sizesol; 254b5fa320bSStefano Zampini } 25559ac8732SStefano Zampini if (!mumps->sym) { 25659ac8732SStefano Zampini char type[2]; 257b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 25859ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25959ac8732SStefano Zampini sprintf(type,"N"); 260b5fa320bSStefano 
Zampini } else { 26159ac8732SStefano Zampini sprintf(type,"T"); 262b5fa320bSStefano Zampini } 26359ac8732SStefano Zampini } else { /* stored by columns */ 26459ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 26559ac8732SStefano Zampini sprintf(type,"T"); 26659ac8732SStefano Zampini } else { 26759ac8732SStefano Zampini sprintf(type,"N"); 26859ac8732SStefano Zampini } 26959ac8732SStefano Zampini } 27059ac8732SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_(type,"N",&B_N,&B_Nrhs,&B_N,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27159ac8732SStefano Zampini } else { 27259ac8732SStefano Zampini char ord[2]; 27359ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 27459ac8732SStefano Zampini sprintf(ord,"L"); 27559ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 27659ac8732SStefano Zampini sprintf(ord,"U"); 27759ac8732SStefano Zampini } 27859ac8732SStefano Zampini PetscStackCallBLAS("BLASsymm",BLASsymm_("L",ord,&B_N,&B_Nrhs,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27959ac8732SStefano Zampini } 280e807eca7SStefano Zampini if (sol_in_redrhs) { 28159ac8732SStefano Zampini ierr = PetscMemcpy(mumps->id.redrhs,mumps->schur_sol,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 282e807eca7SStefano Zampini } 283a12f35bfSStefano Zampini } else { /* Schur complement has not been inverted */ 284a12f35bfSStefano Zampini MumpsScalar *orhs=NULL; 285a12f35bfSStefano Zampini 286a12f35bfSStefano Zampini if (!sol_in_redrhs) { 287a12f35bfSStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 288a12f35bfSStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 289a12f35bfSStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 290a12f35bfSStefano Zampini ierr = 
PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 291a12f35bfSStefano Zampini mumps->schur_sizesol = sizesol; 292a12f35bfSStefano Zampini } 293a12f35bfSStefano Zampini orhs = mumps->id.redrhs; 294a12f35bfSStefano Zampini ierr = PetscMemcpy(mumps->schur_sol,mumps->id.redrhs,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 295a12f35bfSStefano Zampini mumps->id.redrhs = (MumpsScalar*)mumps->schur_sol; 296a12f35bfSStefano Zampini } 29759ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 29859ac8732SStefano Zampini char type[2]; 29959ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 30059ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30159ac8732SStefano Zampini sprintf(type,"N"); 30259ac8732SStefano Zampini } else { 30359ac8732SStefano Zampini sprintf(type,"T"); 30459ac8732SStefano Zampini } 30559ac8732SStefano Zampini } else { /* stored by columns */ 30659ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30759ac8732SStefano Zampini sprintf(type,"T"); 30859ac8732SStefano Zampini } else { 30959ac8732SStefano Zampini sprintf(type,"N"); 31059ac8732SStefano Zampini } 31159ac8732SStefano Zampini } 31259ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 31359ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_(type,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 314b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 315b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRS Lapack routine %d",(int)B_ierr); 316b5fa320bSStefano Zampini } else { /* either full or lower-triangular (not packed) */ 317b5fa320bSStefano Zampini char ord[2]; 318b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 319b5fa320bSStefano Zampini 
sprintf(ord,"L"); 320b5fa320bSStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 321b5fa320bSStefano Zampini sprintf(ord,"U"); 322b5fa320bSStefano Zampini } 323*a0b0af32SStefano Zampini if (mumps->schur_sym == 2) { 324b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32559ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 326b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 327b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRS Lapack routine %d",(int)B_ierr); 328b5fa320bSStefano Zampini } else { 329b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 33059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 331b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 332b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRS Lapack routine %d",(int)B_ierr); 333b5fa320bSStefano Zampini } 334b5fa320bSStefano Zampini } 335e807eca7SStefano Zampini if (!sol_in_redrhs) { 336a12f35bfSStefano Zampini mumps->id.redrhs = orhs; 337e807eca7SStefano Zampini } 33859ac8732SStefano Zampini } 339b5fa320bSStefano Zampini PetscFunctionReturn(0); 340b5fa320bSStefano Zampini } 341b5fa320bSStefano Zampini 34259ac8732SStefano Zampini #undef __FUNCT__ 34359ac8732SStefano Zampini #define __FUNCT__ "MatMumpsHandleSchur_Private" 344b5fa320bSStefano Zampini static PetscErrorCode MatMumpsHandleSchur_Private(Mat_MUMPS* mumps) 345b5fa320bSStefano Zampini { 346b5fa320bSStefano Zampini PetscErrorCode ierr; 347b5fa320bSStefano Zampini 348b5fa320bSStefano Zampini PetscFunctionBegin; 349b5fa320bSStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing when 
Schur complement has not been computed */ 350b5fa320bSStefano Zampini PetscFunctionReturn(0); 351b5fa320bSStefano Zampini } 352b5fa320bSStefano Zampini if (!mumps->schur_second_solve) { /* prepare for the condensation step */ 353b5fa320bSStefano Zampini /* check if schur complement has been computed 354e807eca7SStefano Zampini We set by default ICNTL(26) == -1 when Schur indices have been provided by the user. 355b5fa320bSStefano Zampini According to MUMPS (5.0.0) manual, any value should be harmful during the factorization phase 356b5fa320bSStefano Zampini Unless the user provides a valid value for ICNTL(26), MatSolve and MatMatSolve routines solve the full system. 357b5fa320bSStefano Zampini This requires an extra call to PetscMUMPS_c and the computation of the factors for S, handled setting double_schur_solve to PETSC_TRUE */ 358b5fa320bSStefano Zampini if (mumps->id.ICNTL(26) < 0 || mumps->id.ICNTL(26) > 2) { 359b5fa320bSStefano Zampini PetscInt sizeredrhs = mumps->id.nrhs*mumps->id.size_schur; 360b5fa320bSStefano Zampini /* allocate MUMPS internal array to store reduced right-hand sides */ 361b5fa320bSStefano Zampini if (!mumps->id.redrhs || sizeredrhs > mumps->sizeredrhs) { 362b5fa320bSStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 363b5fa320bSStefano Zampini mumps->id.lredrhs = mumps->id.size_schur; 364b5fa320bSStefano Zampini ierr = PetscMalloc1(mumps->id.nrhs*mumps->id.lredrhs,&mumps->id.redrhs);CHKERRQ(ierr); 365b5fa320bSStefano Zampini mumps->sizeredrhs = mumps->id.nrhs*mumps->id.lredrhs; 366b5fa320bSStefano Zampini } 367b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_TRUE; 368b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 1; /* condensation phase */ 369b5fa320bSStefano Zampini } 370b5fa320bSStefano Zampini } else { /* prepare for the expansion step */ 371b5fa320bSStefano Zampini /* solve Schur complement (this should be done by the MUMPS user, so basically us) */ 372e807eca7SStefano Zampini ierr = 
MatMumpsSolveSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 373b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 2; /* expansion phase */ 374b5fa320bSStefano Zampini PetscMUMPS_c(&mumps->id); 375b5fa320bSStefano Zampini if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 376b5fa320bSStefano Zampini /* restore defaults */ 377b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 378b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 379b5fa320bSStefano Zampini } 380b5fa320bSStefano Zampini PetscFunctionReturn(0); 381b5fa320bSStefano Zampini } 382b5fa320bSStefano Zampini 383397b6df1SKris Buschelman /* 384d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], col[nz], val[nz] 385d341cd04SHong Zhang 386397b6df1SKris Buschelman input: 38767877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 388397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 389bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 390bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 391397b6df1SKris Buschelman output: 392397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 393397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 394eb9baa12SBarry Smith 395eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 396eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 397eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 
398eb9baa12SBarry Smith 399397b6df1SKris Buschelman */ 40016ebf90aSShri Abhyankar 40116ebf90aSShri Abhyankar #undef __FUNCT__ 40216ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 403bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 404b24902e0SBarry Smith { 405185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 40667877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 407dfbe8321SBarry Smith PetscErrorCode ierr; 408c1490034SHong Zhang PetscInt *row,*col; 40916ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 410397b6df1SKris Buschelman 411397b6df1SKris Buschelman PetscFunctionBegin; 41216ebf90aSShri Abhyankar *v=aa->a; 413bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4142205254eSKarl Rupp nz = aa->nz; 4152205254eSKarl Rupp ai = aa->i; 4162205254eSKarl Rupp aj = aa->j; 41716ebf90aSShri Abhyankar *nnz = nz; 418785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 419185f6596SHong Zhang col = row + nz; 420185f6596SHong Zhang 42116ebf90aSShri Abhyankar nz = 0; 42216ebf90aSShri Abhyankar for (i=0; i<M; i++) { 42316ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 42467877ebaSShri Abhyankar ajj = aj + ai[i]; 42567877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 42667877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 42716ebf90aSShri Abhyankar } 42816ebf90aSShri Abhyankar } 42916ebf90aSShri Abhyankar *r = row; *c = col; 43016ebf90aSShri Abhyankar } 43116ebf90aSShri Abhyankar PetscFunctionReturn(0); 43216ebf90aSShri Abhyankar } 433397b6df1SKris Buschelman 43416ebf90aSShri Abhyankar #undef __FUNCT__ 43567877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 436bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 43767877ebaSShri Abhyankar { 43867877ebaSShri Abhyankar Mat_SeqBAIJ 
*aa=(Mat_SeqBAIJ*)A->data; 43933d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 44033d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 44167877ebaSShri Abhyankar PetscErrorCode ierr; 44267877ebaSShri Abhyankar PetscInt *row,*col; 44367877ebaSShri Abhyankar 44467877ebaSShri Abhyankar PetscFunctionBegin; 44533d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 44633d57670SJed Brown M = A->rmap->N/bs; 447cf3759fdSShri Abhyankar *v = aa->a; 448bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 449cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 45067877ebaSShri Abhyankar nz = bs2*aa->nz; 45167877ebaSShri Abhyankar *nnz = nz; 452785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 453185f6596SHong Zhang col = row + nz; 454185f6596SHong Zhang 45567877ebaSShri Abhyankar for (i=0; i<M; i++) { 45667877ebaSShri Abhyankar ajj = aj + ai[i]; 45767877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 45867877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 45967877ebaSShri Abhyankar for (j=0; j<bs; j++) { 46067877ebaSShri Abhyankar for (m=0; m<bs; m++) { 46167877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 462cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 46367877ebaSShri Abhyankar } 46467877ebaSShri Abhyankar } 46567877ebaSShri Abhyankar } 46667877ebaSShri Abhyankar } 467cf3759fdSShri Abhyankar *r = row; *c = col; 46867877ebaSShri Abhyankar } 46967877ebaSShri Abhyankar PetscFunctionReturn(0); 47067877ebaSShri Abhyankar } 47167877ebaSShri Abhyankar 47267877ebaSShri Abhyankar #undef __FUNCT__ 47316ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 474bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 47516ebf90aSShri Abhyankar { 47667877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 47767877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 47816ebf90aSShri Abhyankar PetscErrorCode ierr; 
/* row/col receive the index arrays of the triples; the values are not copied in this routine */
  PetscInt       *row,*col;
  Mat_SeqSBAIJ   *aa=(Mat_SeqSBAIJ*)A->data;

  PetscFunctionBegin;
  /* values alias the matrix's own storage, so they are valid for both reuse modes */
  *v = aa->a;
  if (reuse == MAT_INITIAL_MATRIX) {
    nz   = aa->nz;
    ai   = aa->i;
    aj   = aa->j;
    *v   = aa->a;
    *nnz = nz;
    /* one allocation holds both index arrays: row = [0,nz), col = [nz,2*nz) */
    ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr);
    col  = row + nz;

    nz = 0;
    for (i=0; i<M; i++) {
      rnz = ai[i+1] - ai[i];
      ajj = aj + ai[i];
      for (j=0; j<rnz; j++) {
        row[nz] = i+shift; col[nz++] = ajj[j] + shift;
      }
    }
    *r = row; *c = col;
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij"
/*
  MatConvertToTriples_seqaij_seqsbaij - converts a SeqAIJ matrix to (row,col,val) triples,
  keeping for each row only the entries from position aa->diag[i] to the end of the row
  (the upper triangular part, diagonal included).

  Input:
    A     - the matrix; its data is read as Mat_SeqAIJ
    shift - offset added to every row and column index
    reuse - MAT_INITIAL_MATRIX: allocate and fill row, col and val;
            otherwise: only refresh the values in the existing *v
  Output:
    nnz     - number of triples (set only for MAT_INITIAL_MATRIX)
    r, c, v - row indices, column indices and values

  row, col and val are carved out of ONE allocation whose base pointer is row (*r).

  NOTE(review): r and c are declared int** but are assigned PetscInt* - this is only
  consistent when PetscInt is int; confirm for 64-bit index builds.
  NOTE(review): aa->diag is used without a NULL check - presumably the caller guarantees
  the diagonal has been marked; confirm.
*/
PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
{
  const PetscInt    *ai,*aj,*ajj,*adiag,M=A->rmap->n;
  PetscInt          nz,rnz,i,j;
  const PetscScalar *av,*v1;
  PetscScalar       *val;
  PetscErrorCode    ierr;
  PetscInt          *row,*col;
  Mat_SeqAIJ        *aa=(Mat_SeqAIJ*)A->data;

  PetscFunctionBegin;
  ai   =aa->i; aj=aa->j;av=aa->a;
  adiag=aa->diag;
  if (reuse == MAT_INITIAL_MATRIX) {
    /* count nz in the upper triangular part of A */
    nz = 0;
    for (i=0; i<M; i++) nz += ai[i+1] - adiag[i];
    *nnz = nz;

    /* single buffer laid out as [row | col | val] */
    ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
    col  = row + nz;
    val  = (PetscScalar*)(col + nz);

    nz = 0;
    for (i=0; i<M; i++) {
      rnz = ai[i+1] - adiag[i];
      ajj = aj + adiag[i];
      v1  = av + adiag[i];
      for (j=0; j<rnz; j++) {
        row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j];
      }
    }
    *r = row; *c = col; *v = val;
  } else {
    /* indices are unchanged; copy the values again in the same traversal order */
    nz = 0; val = *v;
    for (i=0; i <M; i++) {
      rnz = ai[i+1] - adiag[i];
      ajj = aj + adiag[i]; /* not read in this branch */
      v1  = av + adiag[i];
      for (j=0; j<rnz; j++) {
        val[nz++] = v1[j];
      }
    }
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij"
/*
  MatConvertToTriples_mpisbaij_mpisbaij - converts the local rows of an MPISBAIJ matrix to
  (row,col,val) triples with global indices.

  For each local row the entries of mat->A are emitted first (column = rstart + local column),
  followed by the entries of mat->B (column = garray[local column]).

  Input/Output: as for the other MatConvertToTriples_* routines; with MAT_INITIAL_MATRIX the
  arrays are allocated as one [row | col | val] buffer, otherwise only val is rewritten.

  NOTE(review): rows are walked as scalar rows (m = A->rmap->n, one value per index entry),
  which looks like it assumes block size 1 - confirm that callers enforce this.
*/
PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
{
  const PetscInt    *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
  PetscErrorCode    ierr;
  PetscInt          rstart,nz,i,j,jj,irow,countA,countB;
  PetscInt          *row,*col;
  const PetscScalar *av, *bv,*v1,*v2;
  PetscScalar       *val;
  Mat_MPISBAIJ      *mat = (Mat_MPISBAIJ*)A->data;
  Mat_SeqSBAIJ      *aa  = (Mat_SeqSBAIJ*)(mat->A)->data;
  Mat_SeqBAIJ       *bb  = (Mat_SeqBAIJ*)(mat->B)->data;

  PetscFunctionBegin;
  ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart;
  av=aa->a; bv=bb->a;

  garray = mat->garray;

  if (reuse == MAT_INITIAL_MATRIX) {
    nz   = aa->nz + bb->nz;
    *nnz = nz;
    /* single buffer laid out as [row | col | val] */
    ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
    col  = row + nz;
    val  = (PetscScalar*)(col + nz);

    *r = row; *c = col; *v = val;
  } else {
    row = *r; col = *c; val = *v;
  }

  /* jj: running triple index; irow: global index of the current row */
  jj = 0; irow = rstart;
  for (i=0; i<m; i++) {
    ajj    = aj + ai[i];                 /* ptr to the beginning of this row */
    countA = ai[i+1] - ai[i];
    countB = bi[i+1] - bi[i];
    bjj    = bj + bi[i];
    v1     = av + ai[i];
    v2     = bv + bi[i];

    /* A-part */
    for (j=0; j<countA; j++) {
      if (reuse == MAT_INITIAL_MATRIX) {
        row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
      }
      val[jj++] = v1[j];
    }

    /* B-part */
    for (j=0; j < countB; j++) {
      if (reuse == MAT_INITIAL_MATRIX) {
        row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
      }
      val[jj++] = v2[j];
    }
    irow++;
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij"
/*
  MatConvertToTriples_mpiaij_mpiaij - converts the local rows of an MPIAIJ matrix to
  (row,col,val) triples with global indices, keeping every stored entry.

  For each local row the entries of mat->A are emitted first (column = rstart + local column),
  followed by the entries of mat->B (column = garray[local column]).

  With MAT_INITIAL_MATRIX the arrays are allocated as one [row | col | val] buffer and *nnz is
  set to aa->nz + bb->nz; otherwise the existing arrays are reused and only val is rewritten.
*/
PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
{
  const PetscInt    *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
  PetscErrorCode    ierr;
  PetscInt          rstart,nz,i,j,jj,irow,countA,countB;
  PetscInt          *row,*col;
  const PetscScalar *av, *bv,*v1,*v2;
  PetscScalar       *val;
  Mat_MPIAIJ        *mat = (Mat_MPIAIJ*)A->data;
  Mat_SeqAIJ        *aa  = (Mat_SeqAIJ*)(mat->A)->data;
  Mat_SeqAIJ        *bb  = (Mat_SeqAIJ*)(mat->B)->data;

  PetscFunctionBegin;
  ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart;
  av=aa->a; bv=bb->a;

  garray = mat->garray;

  if (reuse == MAT_INITIAL_MATRIX) {
    nz   = aa->nz + bb->nz;
    *nnz = nz;
    /* single buffer laid out as [row | col | val] */
    ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
    col  = row + nz;
    val  = (PetscScalar*)(col + nz);

    *r = row; *c = col; *v = val;
  } else {
    row = *r; col = *c; val = *v;
  }

  /* jj: running triple index; irow: global index of the current row */
  jj = 0; irow = rstart;
  for (i=0; i<m; i++) {
    ajj    = aj + ai[i];                 /* ptr to the beginning of this row */
    countA = ai[i+1] - ai[i];
    countB = bi[i+1] - bi[i];
    bjj    = bj + bi[i];
    v1     = av + ai[i];
    v2     = bv + bi[i];

    /* A-part */
    for (j=0; j<countA; j++) {
      if (reuse == MAT_INITIAL_MATRIX) {
        row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
      }
      val[jj++] = v1[j];
    }

    /* B-part */
    for (j=0; j < countB; j++) {
      if (reuse == MAT_INITIAL_MATRIX) {
        row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
      }
      val[jj++] = v2[j];
    }
    irow++;
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij"
/*
  MatConvertToTriples_mpibaij_mpiaij - expands the local block rows of an MPIBAIJ matrix into
  scalar (row,col,val) triples with global indices.

  Every stored bs x bs block contributes bs*bs triples. Within a block the values are consumed
  sequentially while the column offset j is the outer loop and the row offset n the inner loop.
  Block columns of mat->A are offset by rstart; block columns of mat->B go through garray.

  With MAT_INITIAL_MATRIX the arrays are allocated as one [row | col | val] buffer and *nnz is
  set to bs2*(aa->nz + bb->nz); otherwise the existing arrays are reused and only val is rewritten.
*/
PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
{
  Mat_MPIBAIJ       *mat    = (Mat_MPIBAIJ*)A->data;
  Mat_SeqBAIJ       *aa     = (Mat_SeqBAIJ*)(mat->A)->data;
  Mat_SeqBAIJ       *bb     = (Mat_SeqBAIJ*)(mat->B)->data;
  const PetscInt    *ai     = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj;
  const PetscInt    *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart;
  const PetscInt    bs2=mat->bs2;
  PetscErrorCode    ierr;
  PetscInt          bs,nz,i,j,k,n,jj,irow,countA,countB,idx;
  PetscInt          *row,*col;
  const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2;
  PetscScalar       *val;

  PetscFunctionBegin;
  ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr);
  if (reuse == MAT_INITIAL_MATRIX) {
    nz   = bs2*(aa->nz + bb->nz);
    *nnz = nz;
    /* single buffer laid out as [row | col | val] */
    ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
    col  = row + nz;
    val  = (PetscScalar*)(col + nz);

    *r = row; *c = col; *v = val;
  } else {
    row = *r; col = *c; val = *v;
  }

  /* jj: running triple index; irow: global index of the first scalar row of the block row */
  jj = 0; irow = rstart;
  for (i=0; i<mbs; i++) {
    countA = ai[i+1] - ai[i];
    countB = bi[i+1] - bi[i];
    ajj    = aj + ai[i];
    bjj    = bj + bi[i];
    v1     = av + bs2*ai[i];
    v2     = bv + bs2*bi[i];

    idx = 0; /* position inside this block row's values of mat->A */
    /* A-part */
    for (k=0; k<countA; k++) {
      for (j=0; j<bs; j++) {
        for (n=0; n<bs; n++) {
          if (reuse == MAT_INITIAL_MATRIX) {
            row[jj] = irow + n + shift;
            col[jj] = rstart + bs*ajj[k] + j + shift;
          }
          val[jj++] = v1[idx++];
        }
      }
    }

    idx = 0; /* position inside this block row's values of mat->B */
    /* B-part */
    for (k=0; k<countB; k++) {
      for (j=0; j<bs; j++) {
        for (n=0; n<bs; n++) {
          if (reuse == MAT_INITIAL_MATRIX) {
            row[jj] = irow + n + shift;
            col[jj] = bs*garray[bjj[k]] + j + shift;
          }
          val[jj++] = v2[idx++];
        }
      }
    }
    irow += bs;
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij"
/*
  MatConvertToTriples_mpiaij_mpisbaij - converts the local rows of an MPIAIJ matrix to
  (row,col,val) triples with global indices, keeping only the upper triangular part.

  From mat->A each row contributes the entries from aa->diag[i] to the end of the row.
  From mat->B only entries whose global column garray[col] is greater than rstart are kept.
  The counting pass and the fill pass apply the same two filters, so *nnz matches the number
  of triples written.

  With MAT_INITIAL_MATRIX the arrays are allocated as one [row | col | val] buffer; otherwise
  the existing arrays are reused and only val is rewritten.
*/
PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
{
  const PetscInt    *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
  PetscErrorCode    ierr;
  PetscInt          rstart,nz,nza,nzb,i,j,jj,irow,countA,countB;
  PetscInt          *row,*col;
  const PetscScalar *av, *bv,*v1,*v2;
  PetscScalar       *val;
  Mat_MPIAIJ        *mat =  (Mat_MPIAIJ*)A->data;
  Mat_SeqAIJ        *aa  =(Mat_SeqAIJ*)(mat->A)->data;
  Mat_SeqAIJ        *bb  =(Mat_SeqAIJ*)(mat->B)->data;

  PetscFunctionBegin;
  ai=aa->i; aj=aa->j; adiag=aa->diag;
  bi=bb->i; bj=bb->j; garray = mat->garray;
  av=aa->a; bv=bb->a;

  rstart = A->rmap->rstart;

  if (reuse == MAT_INITIAL_MATRIX) {
    nza = 0;    /* num of upper triangular entries in mat->A, including diagonals */
    nzb = 0;    /* num of upper triangular entries in mat->B */
    for (i=0; i<m; i++) {
      nza   += (ai[i+1] - adiag[i]);
      countB = bi[i+1] - bi[i];
      bjj    = bj + bi[i];
      for (j=0; j<countB; j++) {
        if (garray[bjj[j]] > rstart) nzb++;
      }
    }

    nz   = nza + nzb; /* total nz of upper triangular part of mat */
    *nnz = nz;
    /* single buffer laid out as [row | col | val] */
    ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
    col  = row + nz;
    val  = (PetscScalar*)(col + nz);

    *r = row; *c = col; *v = val;
  } else {
    row = *r; col = *c; val = *v;
  }

  /* jj: running triple index; irow: global index of the current row */
  jj = 0; irow = rstart;
  for (i=0; i<m; i++) {
    ajj    = aj + adiag[i];                 /* ptr to the beginning of the diagonal of this row */
    v1     = av + adiag[i];
    countA = ai[i+1] - adiag[i];
    countB = bi[i+1] - bi[i];
    bjj    = bj + bi[i];
    v2     = bv + bi[i];

    /* A-part */
    for (j=0; j<countA; j++) {
      if (reuse == MAT_INITIAL_MATRIX) {
        row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
      }
      val[jj++] = v1[j];
    }

    /* B-part */
    for (j=0; j < countB; j++) {
      if (garray[bjj[j]] > rstart) {
        if (reuse == MAT_INITIAL_MATRIX) {
          row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
        }
        val[jj++] = v2[j];
      }
    }
    irow++;
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatGetDiagonal_MUMPS"
/*
  MatGetDiagonal_MUMPS - not supported for a MUMPS factor; always raises PETSC_ERR_SUP.
*/
PetscErrorCode MatGetDiagonal_MUMPS(Mat A,Vec v)
{
  PetscFunctionBegin;
  SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Mat type: MUMPS factor");
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatDestroy_MUMPS"
/*
  MatDestroy_MUMPS - releases everything the MUMPS factor attached to A.

  When the MUMPS instance was initialized (CleanUpMUMPS is set) the solve work space, the
  scatters, the sequential vectors, the permutation, the triple buffer, the INFO list and the
  Schur data are freed, MUMPS is called with JOB_END and the duplicated communicator is freed.
  Afterwards the saved Destroy callback (if any) is invoked, the Mat_MUMPS context is freed
  and every function composed on A by this interface is removed.
*/
PetscErrorCode MatDestroy_MUMPS(Mat A)
{
  /* composed function names, listed in the order in which they are removed */
  static const char *const composed[] = {
    "MatFactorGetSolverPackage_C",
    "MatMumpsSetIcntl_C",
    "MatMumpsGetIcntl_C",
    "MatMumpsSetCntl_C",
    "MatMumpsGetCntl_C",
    "MatMumpsGetInfo_C",
    "MatMumpsGetInfog_C",
    "MatMumpsGetRinfo_C",
    "MatMumpsGetRinfog_C",
    "MatMumpsSetSchurIndices_C",
    "MatMumpsInvertSchurComplement_C",
    "MatMumpsCreateSchurComplement_C",
    "MatMumpsGetSchurComplement_C",
    "MatMumpsRestoreSchurComplement_C",
    "MatMumpsSolveSchurComplement_C",
    "MatMumpsSolveSchurComplementTranspose_C",
    "MatMumpsSchurComplementSetSym_C"
  };
  const PetscInt ncomposed = (PetscInt)(sizeof(composed)/sizeof(composed[0]));
  Mat_MUMPS      *ctx      = (Mat_MUMPS*)A->spptr;
  PetscErrorCode ierr;
  PetscInt       k;

  PetscFunctionBegin;
  if (ctx->CleanUpMUMPS) {
    /* PETSc-side work space first */
    ierr = PetscFree2(ctx->id.sol_loc,ctx->id.isol_loc);CHKERRQ(ierr);
    ierr = VecScatterDestroy(&ctx->scat_rhs);CHKERRQ(ierr);
    ierr = VecScatterDestroy(&ctx->scat_sol);CHKERRQ(ierr);
    ierr = VecDestroy(&ctx->b_seq);CHKERRQ(ierr);
    ierr = VecDestroy(&ctx->x_seq);CHKERRQ(ierr);
    ierr = PetscFree(ctx->id.perm_in);CHKERRQ(ierr);
    ierr = PetscFree(ctx->irn);CHKERRQ(ierr);
    ierr = PetscFree(ctx->info);CHKERRQ(ierr);
    ierr = MatMumpsResetSchur_Private(ctx);CHKERRQ(ierr);

    /* then terminate the MUMPS instance and give back its communicator */
    ctx->id.job = JOB_END;
    PetscMUMPS_c(&ctx->id);
    ierr = MPI_Comm_free(&(ctx->comm_mumps));CHKERRQ(ierr);
  }

  if (ctx->Destroy) {
    ierr = (ctx->Destroy)(A);CHKERRQ(ierr);
  }
  ierr = PetscFree(A->spptr);CHKERRQ(ierr);

  /* clear composed functions */
  for (k=0; k<ncomposed; k++) {
    ierr = PetscObjectComposeFunction((PetscObject)A,composed[k],NULL);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatSolve_MUMPS"
PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 886b24902e0SBarry Smith { 887a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 888d54de34fSKris Buschelman PetscScalar *array; 88967877ebaSShri Abhyankar Vec b_seq; 890329ec9b3SHong Zhang IS is_iden,is_petsc; 891dfbe8321SBarry Smith PetscErrorCode ierr; 892329ec9b3SHong Zhang PetscInt i; 893883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 894397b6df1SKris Buschelman 895397b6df1SKris Buschelman PetscFunctionBegin; 896883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 897883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 898a5e57a09SHong Zhang mumps->id.nrhs = 1; 899a5e57a09SHong Zhang b_seq = mumps->b_seq; 900a5e57a09SHong Zhang if (mumps->size > 1) { 901329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. 
Scatter b into a seqential rhs vector */ 902a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 903a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 904a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 905397b6df1SKris Buschelman } else { /* size == 1 */ 906397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 907397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 908397b6df1SKris Buschelman } 909a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 910a5e57a09SHong Zhang mumps->id.nrhs = 1; 911940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 912397b6df1SKris Buschelman } 913397b6df1SKris Buschelman 914b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 915b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 916b5fa320bSStefano Zampini 917397b6df1SKris Buschelman /* solve phase */ 918329ec9b3SHong Zhang /*-------------*/ 919a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 920a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 921a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 922397b6df1SKris Buschelman 923b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 924b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 925b5fa320bSStefano Zampini 926a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 927a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 928a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 929a5e57a09SHong Zhang ierr = 
VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 930397b6df1SKris Buschelman } 931a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 932a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 933a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 934a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 935a5e57a09SHong Zhang } 936a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 937a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 9386bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9396bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 9402205254eSKarl Rupp 941a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 942397b6df1SKris Buschelman } 943a5e57a09SHong Zhang 944a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 945a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 946329ec9b3SHong Zhang } 947397b6df1SKris Buschelman PetscFunctionReturn(0); 948397b6df1SKris Buschelman } 949397b6df1SKris Buschelman 95051d5961aSHong Zhang #undef __FUNCT__ 95151d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 95251d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 95351d5961aSHong Zhang { 954a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 95551d5961aSHong Zhang PetscErrorCode ierr; 95651d5961aSHong Zhang 95751d5961aSHong Zhang PetscFunctionBegin; 958a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 9590ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 960a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 96151d5961aSHong Zhang 
PetscFunctionReturn(0); 96251d5961aSHong Zhang } 96351d5961aSHong Zhang 964e0b74bf9SHong Zhang #undef __FUNCT__ 965e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 966e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 967e0b74bf9SHong Zhang { 968bda8bf91SBarry Smith PetscErrorCode ierr; 969bda8bf91SBarry Smith PetscBool flg; 9704e34a73bSHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 971334c5f61SHong Zhang PetscInt i,nrhs,M; 9722cd7d884SHong Zhang PetscScalar *array,*bray; 973bda8bf91SBarry Smith 974e0b74bf9SHong Zhang PetscFunctionBegin; 9750298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 976801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 9770298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 978801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 979801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 9804e34a73bSHong Zhang 9812cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 982334c5f61SHong Zhang mumps->id.nrhs = nrhs; 983334c5f61SHong Zhang mumps->id.lrhs = M; 9844e34a73bSHong Zhang 9852cd7d884SHong Zhang if (mumps->size == 1) { 9862cd7d884SHong Zhang /* copy B to X */ 9872cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 9882cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 9896444a565SStefano Zampini ierr = PetscMemcpy(array,bray,M*nrhs*sizeof(PetscScalar));CHKERRQ(ierr); 9902cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 991940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 992b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if 
any) */ 993b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 994801fbe65SHong Zhang 9952cd7d884SHong Zhang /* solve phase */ 9962cd7d884SHong Zhang /*-------------*/ 9972cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 9982cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 9992cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 1000b5fa320bSStefano Zampini 1001b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 1002b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 10032cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 1004334c5f61SHong Zhang } else { /*--------- parallel case --------*/ 100571aed81dSHong Zhang PetscInt lsol_loc,nlsol_loc,*isol_loc,*idx,*iidx,*idxx,*isol_loc_save; 10061070efccSSatish Balay MumpsScalar *sol_loc,*sol_loc_save; 1007801fbe65SHong Zhang IS is_to,is_from; 1008334c5f61SHong Zhang PetscInt k,proc,j,m; 1009801fbe65SHong Zhang const PetscInt *rstart; 1010334c5f61SHong Zhang Vec v_mpi,b_seq,x_seq; 1011334c5f61SHong Zhang VecScatter scat_rhs,scat_sol; 1012801fbe65SHong Zhang 1013801fbe65SHong Zhang /* create x_seq to hold local solution */ 101471aed81dSHong Zhang isol_loc_save = mumps->id.isol_loc; /* save it for MatSovle() */ 101571aed81dSHong Zhang sol_loc_save = mumps->id.sol_loc; 1016801fbe65SHong Zhang 101771aed81dSHong Zhang lsol_loc = mumps->id.INFO(23); 101871aed81dSHong Zhang nlsol_loc = nrhs*lsol_loc; /* length of sol_loc */ 101971aed81dSHong Zhang ierr = PetscMalloc2(nlsol_loc,&sol_loc,nlsol_loc,&isol_loc);CHKERRQ(ierr); 1020940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1021801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 1022801fbe65SHong Zhang 10231070efccSSatish Balay ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,nlsol_loc,(PetscScalar*)sol_loc,&x_seq);CHKERRQ(ierr); 10242cd7d884SHong Zhang 
102574f0fcc7SHong Zhang /* copy rhs matrix B into vector v_mpi */ 1026334c5f61SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 1027801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 102874f0fcc7SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&v_mpi);CHKERRQ(ierr); 1029801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 1030801fbe65SHong Zhang 1031334c5f61SHong Zhang /* scatter v_mpi to b_seq because MUMPS only supports centralized rhs */ 103274f0fcc7SHong Zhang /* idx: maps from k-th index of v_mpi to (i,j)-th global entry of B; 1033801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 1034801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 1035801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 1036801fbe65SHong Zhang k = 0; 1037801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 1038801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 1039801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 1040801fbe65SHong Zhang iidx[j*M + i] = k; 1041801fbe65SHong Zhang idx[k++] = j*M + i; 1042801fbe65SHong Zhang } 1043801fbe65SHong Zhang } 10442cd7d884SHong Zhang } 10452cd7d884SHong Zhang 1046801fbe65SHong Zhang if (!mumps->myid) { 1047334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&b_seq);CHKERRQ(ierr); 1048801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1049801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 1050801fbe65SHong Zhang } else { 1051334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&b_seq);CHKERRQ(ierr); 1052801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 1053801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 1054801fbe65SHong Zhang } 1055334c5f61SHong 
Zhang ierr = VecScatterCreate(v_mpi,is_from,b_seq,is_to,&scat_rhs);CHKERRQ(ierr); 1056334c5f61SHong Zhang ierr = VecScatterBegin(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1057801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1058801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1059334c5f61SHong Zhang ierr = VecScatterEnd(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1060801fbe65SHong Zhang 1061801fbe65SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 1062334c5f61SHong Zhang ierr = VecGetArray(b_seq,&bray);CHKERRQ(ierr); 1063940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)bray; 1064334c5f61SHong Zhang ierr = VecRestoreArray(b_seq,&bray);CHKERRQ(ierr); 1065801fbe65SHong Zhang } 1066801fbe65SHong Zhang 1067801fbe65SHong Zhang /* solve phase */ 1068801fbe65SHong Zhang /*-------------*/ 1069801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 1070801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 1071801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 1072801fbe65SHong Zhang 1073334c5f61SHong Zhang /* scatter mumps distributed solution to petsc vector v_mpi, which shares local arrays with solution matrix X */ 107474f0fcc7SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 107574f0fcc7SHong Zhang ierr = VecPlaceArray(v_mpi,array);CHKERRQ(ierr); 1076801fbe65SHong Zhang 1077334c5f61SHong Zhang /* create scatter scat_sol */ 107871aed81dSHong Zhang ierr = PetscMalloc1(nlsol_loc,&idxx);CHKERRQ(ierr); 107971aed81dSHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nlsol_loc,0,1,&is_from);CHKERRQ(ierr); 108071aed81dSHong Zhang for (i=0; i<lsol_loc; i++) { 1081334c5f61SHong Zhang isol_loc[i] -= 1; /* change Fortran style to C style */ 1082334c5f61SHong Zhang idxx[i] = iidx[isol_loc[i]]; 1083801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 1084334c5f61SHong Zhang idxx[j*lsol_loc+i] = 
iidx[isol_loc[i]+j*M]; 1085801fbe65SHong Zhang } 1086801fbe65SHong Zhang } 108771aed81dSHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nlsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1088334c5f61SHong Zhang ierr = VecScatterCreate(x_seq,is_from,v_mpi,is_to,&scat_sol);CHKERRQ(ierr); 1089334c5f61SHong Zhang ierr = VecScatterBegin(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1090801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1091801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1092334c5f61SHong Zhang ierr = VecScatterEnd(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1093801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 109471aed81dSHong Zhang 109571aed81dSHong Zhang /* free spaces */ 109671aed81dSHong Zhang mumps->id.sol_loc = sol_loc_save; 109771aed81dSHong Zhang mumps->id.isol_loc = isol_loc_save; 109871aed81dSHong Zhang 109971aed81dSHong Zhang ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 1100801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 1101801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 110271aed81dSHong Zhang ierr = VecDestroy(&x_seq);CHKERRQ(ierr); 110374f0fcc7SHong Zhang ierr = VecDestroy(&v_mpi);CHKERRQ(ierr); 1104334c5f61SHong Zhang ierr = VecDestroy(&b_seq);CHKERRQ(ierr); 1105334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_rhs);CHKERRQ(ierr); 1106334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_sol);CHKERRQ(ierr); 1107801fbe65SHong Zhang } 1108e0b74bf9SHong Zhang PetscFunctionReturn(0); 1109e0b74bf9SHong Zhang } 1110e0b74bf9SHong Zhang 1111ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 1112a58c3f20SHong Zhang /* 1113a58c3f20SHong Zhang input: 1114a58c3f20SHong Zhang F: numeric factor 1115a58c3f20SHong Zhang output: 1116a58c3f20SHong Zhang nneg: total number of negative pivots 1117a58c3f20SHong Zhang nzero: 0 1118a58c3f20SHong Zhang npos: (global dimension of F) - nneg 1119a58c3f20SHong Zhang */ 1120a58c3f20SHong 
Zhang 1121a58c3f20SHong Zhang #undef __FUNCT__ 1122a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 1123dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 1124a58c3f20SHong Zhang { 1125a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1126dfbe8321SBarry Smith PetscErrorCode ierr; 1127c1490034SHong Zhang PetscMPIInt size; 1128a58c3f20SHong Zhang 1129a58c3f20SHong Zhang PetscFunctionBegin; 1130ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 1131bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 1132a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 1133ed85ac9fSHong Zhang 1134710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 1135ed85ac9fSHong Zhang if (nzero || npos) { 1136ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 1137710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 1138710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 1139a58c3f20SHong Zhang } 1140a58c3f20SHong Zhang PetscFunctionReturn(0); 1141a58c3f20SHong Zhang } 1142ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 1143a58c3f20SHong Zhang 1144397b6df1SKris Buschelman #undef __FUNCT__ 1145f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 11460481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 1147af281ebdSHong Zhang { 1148a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 11496849ba73SBarry Smith PetscErrorCode ierr; 
1150e09efc27SHong Zhang Mat F_diag; 1151ace3abfcSBarry Smith PetscBool isMPIAIJ; 1152397b6df1SKris Buschelman 1153397b6df1SKris Buschelman PetscFunctionBegin; 1154a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1155397b6df1SKris Buschelman 1156397b6df1SKris Buschelman /* numerical factorization phase */ 1157329ec9b3SHong Zhang /*-------------------------------*/ 1158a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 11594e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 1160a5e57a09SHong Zhang if (!mumps->myid) { 1161940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 1162397b6df1SKris Buschelman } 1163397b6df1SKris Buschelman } else { 1164940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 1165397b6df1SKris Buschelman } 1166a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1167a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 1168151787a6SHong Zhang if (mumps->id.INFO(1) == -13) { 1169151787a6SHong Zhang if (mumps->id.INFO(2) < 0) { 1170151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",-mumps->id.INFO(2)); 1171151787a6SHong Zhang } else { 1172151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d bytes\n",mumps->id.INFO(2)); 1173151787a6SHong Zhang } 1174151787a6SHong Zhang } else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 1175397b6df1SKris Buschelman } 1176a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 1177397b6df1SKris Buschelman 1178dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 
1179a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 1180a5e57a09SHong Zhang mumps->CleanUpMUMPS = PETSC_TRUE; 1181b5fa320bSStefano Zampini mumps->schur_factored = PETSC_FALSE; 118259ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 118367877ebaSShri Abhyankar 1184066565c5SStefano Zampini /* just to be sure that ICNTL(19) value returned by a call from MatMumpsGetIcntl is always consistent */ 1185066565c5SStefano Zampini if (!mumps->sym && mumps->id.ICNTL(19) && mumps->id.ICNTL(19) != 1) mumps->id.ICNTL(19) = 3; 1186066565c5SStefano Zampini 1187a5e57a09SHong Zhang if (mumps->size > 1) { 118867877ebaSShri Abhyankar PetscInt lsol_loc; 118967877ebaSShri Abhyankar PetscScalar *sol_loc; 11902205254eSKarl Rupp 1191c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 1192c2093ab7SHong Zhang if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 1193c2093ab7SHong Zhang else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 1194c2093ab7SHong Zhang F_diag->assembled = PETSC_TRUE; 1195c2093ab7SHong Zhang 1196c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 1197c2093ab7SHong Zhang if (mumps->x_seq) { 1198c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 1199c2093ab7SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 1200c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 1201c2093ab7SHong Zhang } 1202a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 1203dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 1204a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 1205940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1206a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 120767877ebaSShri Abhyankar } 1208397b6df1SKris Buschelman PetscFunctionReturn(0); 
1209397b6df1SKris Buschelman } 1210397b6df1SKris Buschelman 12119a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 1212dcd589f8SShri Abhyankar #undef __FUNCT__ 12139a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 12149a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 1215dcd589f8SShri Abhyankar { 12169a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1217dcd589f8SShri Abhyankar PetscErrorCode ierr; 1218b34f08ffSHong Zhang PetscInt icntl,info[40],i,ninfo=40; 1219ace3abfcSBarry Smith PetscBool flg; 1220dcd589f8SShri Abhyankar 1221dcd589f8SShri Abhyankar PetscFunctionBegin; 1222ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 12239a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 12249a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 12259a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 12269a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 12279a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 12289a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 1229dcd589f8SShri Abhyankar 12309a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 12319a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 12329a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 12339a2535b5SHong Zhang 1234d341cd04SHong Zhang ierr = 
PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 12359a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 12369a2535b5SHong Zhang 1237d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 1238dcd589f8SShri Abhyankar if (flg) { 12392205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 12402205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 1241dcd589f8SShri Abhyankar } 1242e0b74bf9SHong Zhang 12430298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 1244d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 12450298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 1246d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 1247d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 1248d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its 
splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 1249d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 1250d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 125159ac8732SStefano Zampini if (mumps->id.ICNTL(19) <= 0 || mumps->id.ICNTL(19) > 3) { /* reset any schur data (if any) */ 125259ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 125359ac8732SStefano Zampini } 12544e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 1255d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 12569a2535b5SHong Zhang 1257d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 12580298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 12590298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 12609a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 12619a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with 
the correct detection of null pivots */ 1262d7ebd59bSHong Zhang } 1263d7ebd59bSHong Zhang 1264d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 1265d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 12662cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 12670298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 1268d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 12690298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 1270d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 12714e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 12720298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute 
determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1273dcd589f8SShri Abhyankar 12740298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 12750298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 12760298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 12770298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 12780298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1279e5bb22a1SHong Zhang 12800298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1281b34f08ffSHong Zhang 128216d797efSHong Zhang ierr = PetscOptionsIntArray("-mat_mumps_view_info","request INFO local to each processor","",info,&ninfo,NULL);CHKERRQ(ierr); 1283b34f08ffSHong Zhang if (ninfo) { 1284b34f08ffSHong Zhang if (ninfo > 40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"number of INFO %d must <= 40\n",ninfo); 1285b34f08ffSHong Zhang ierr = PetscMalloc1(ninfo,&mumps->info);CHKERRQ(ierr); 1286b34f08ffSHong Zhang mumps->ninfo = ninfo; 1287b34f08ffSHong Zhang for (i=0; i<ninfo; i++) { 1288b34f08ffSHong Zhang if (info[i] < 0 || info[i]>40) { 1289b34f08ffSHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"index of INFO %d must between 1 and 40\n",ninfo); 1290b34f08ffSHong Zhang } else { 1291b34f08ffSHong Zhang mumps->info[i] = info[i]; 1292b34f08ffSHong Zhang } 1293b34f08ffSHong Zhang } 1294b34f08ffSHong 
Zhang } 1295b34f08ffSHong Zhang 1296dcd589f8SShri Abhyankar PetscOptionsEnd(); 1297dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1298dcd589f8SShri Abhyankar } 1299dcd589f8SShri Abhyankar 1300dcd589f8SShri Abhyankar #undef __FUNCT__ 1301dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1302f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1303dcd589f8SShri Abhyankar { 1304dcd589f8SShri Abhyankar PetscErrorCode ierr; 1305dcd589f8SShri Abhyankar 1306dcd589f8SShri Abhyankar PetscFunctionBegin; 1307ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1308ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1309ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 13102205254eSKarl Rupp 1311f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1312f697e70eSHong Zhang 1313f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1314f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1315f697e70eSHong Zhang mumps->id.sym = mumps->sym; 13162907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1317f697e70eSHong Zhang 1318f697e70eSHong Zhang mumps->CleanUpMUMPS = PETSC_FALSE; 13190298fd71SBarry Smith mumps->scat_rhs = NULL; 13200298fd71SBarry Smith mumps->scat_sol = NULL; 13219a2535b5SHong Zhang 132270544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 13239a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 13249a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 13259a2535b5SHong Zhang if (mumps->size == 1) { 13269a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 13279a2535b5SHong Zhang } else { 13289a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 13294e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 133070544d5fSHong Zhang mumps->id.ICNTL(21) 
= 1; /* distributed solution */ 13319a2535b5SHong Zhang } 13326444a565SStefano Zampini 13336444a565SStefano Zampini /* schur */ 13346444a565SStefano Zampini mumps->id.size_schur = 0; 13356444a565SStefano Zampini mumps->id.listvar_schur = NULL; 13366444a565SStefano Zampini mumps->id.schur = NULL; 1337b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 1338b5fa320bSStefano Zampini mumps->sizeredrhs = 0; 1339b5fa320bSStefano Zampini mumps->schur_pivots = NULL; 1340b5fa320bSStefano Zampini mumps->schur_work = NULL; 134159ac8732SStefano Zampini mumps->schur_sol = NULL; 134259ac8732SStefano Zampini mumps->schur_sizesol = 0; 134359ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 134459ac8732SStefano Zampini mumps->schur_factored = PETSC_FALSE; 134559ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 1346*a0b0af32SStefano Zampini mumps->schur_sym = mumps->id.sym; 1347dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1348dcd589f8SShri Abhyankar } 1349dcd589f8SShri Abhyankar 1350a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1351397b6df1SKris Buschelman #undef __FUNCT__ 1352f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 13530481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1354b24902e0SBarry Smith { 1355a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1356dcd589f8SShri Abhyankar PetscErrorCode ierr; 135767877ebaSShri Abhyankar Vec b; 135867877ebaSShri Abhyankar IS is_iden; 135967877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1360397b6df1SKris Buschelman 1361397b6df1SKris Buschelman PetscFunctionBegin; 1362a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1363dcd589f8SShri Abhyankar 13649a2535b5SHong Zhang /* Set MUMPS options from the options database */ 13659a2535b5SHong Zhang ierr = 
PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1366dcd589f8SShri Abhyankar 1367a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1368dcd589f8SShri Abhyankar 136967877ebaSShri Abhyankar /* analysis phase */ 137067877ebaSShri Abhyankar /*----------------*/ 1371a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1372a5e57a09SHong Zhang mumps->id.n = M; 1373a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 137467877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1375a5e57a09SHong Zhang if (!mumps->myid) { 1376a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1377a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1378940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 137967877ebaSShri Abhyankar } 1380a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 13815248a706SHong Zhang /* 13825248a706SHong Zhang PetscBool flag; 13835248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 13845248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 13855248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 13865248a706SHong Zhang */ 1387a5e57a09SHong Zhang if (!mumps->myid) { 1388e0b74bf9SHong Zhang const PetscInt *idx; 1389e0b74bf9SHong Zhang PetscInt i,*perm_in; 13902205254eSKarl Rupp 1391785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1392e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 13932205254eSKarl Rupp 1394a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1395e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! 
*/ 1396e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1397e0b74bf9SHong Zhang } 1398e0b74bf9SHong Zhang } 139967877ebaSShri Abhyankar } 140067877ebaSShri Abhyankar break; 140167877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1402a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1403a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1404a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1405940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 140667877ebaSShri Abhyankar } 140767877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1408a5e57a09SHong Zhang if (!mumps->myid) { 14092cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 14102cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 141167877ebaSShri Abhyankar } else { 1412a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 141367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 141467877ebaSShri Abhyankar } 14152a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1416a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14176bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14186bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 141967877ebaSShri Abhyankar break; 142067877ebaSShri Abhyankar } 1421a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1422a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 142367877ebaSShri Abhyankar 1424719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1425dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 142651d5961aSHong Zhang 
F->ops->solvetranspose = MatSolveTranspose_MUMPS; 14274e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1428b24902e0SBarry Smith PetscFunctionReturn(0); 1429b24902e0SBarry Smith } 1430b24902e0SBarry Smith 1431450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1432450b117fSShri Abhyankar #undef __FUNCT__ 1433450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 1434450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1435450b117fSShri Abhyankar { 1436a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1437dcd589f8SShri Abhyankar PetscErrorCode ierr; 143867877ebaSShri Abhyankar Vec b; 143967877ebaSShri Abhyankar IS is_iden; 144067877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1441450b117fSShri Abhyankar 1442450b117fSShri Abhyankar PetscFunctionBegin; 1443a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1444dcd589f8SShri Abhyankar 14459a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14469a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1447dcd589f8SShri Abhyankar 1448a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 144967877ebaSShri Abhyankar 145067877ebaSShri Abhyankar /* analysis phase */ 145167877ebaSShri Abhyankar /*----------------*/ 1452a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1453a5e57a09SHong Zhang mumps->id.n = M; 1454a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 145567877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1456a5e57a09SHong Zhang if (!mumps->myid) { 1457a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1458a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1459940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 146067877ebaSShri Abhyankar } 146167877ebaSShri Abhyankar } 
146267877ebaSShri Abhyankar break; 146367877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1464a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1465a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1466a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1467940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 146867877ebaSShri Abhyankar } 146967877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1470a5e57a09SHong Zhang if (!mumps->myid) { 1471a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 147267877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 147367877ebaSShri Abhyankar } else { 1474a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 147567877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 147667877ebaSShri Abhyankar } 14772a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1478a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14796bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14806bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 148167877ebaSShri Abhyankar break; 148267877ebaSShri Abhyankar } 1483a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1484a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 148567877ebaSShri Abhyankar 1486450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1487dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 148851d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1489450b117fSShri Abhyankar PetscFunctionReturn(0); 1490450b117fSShri Abhyankar } 1491b24902e0SBarry Smith 
1492141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1493397b6df1SKris Buschelman #undef __FUNCT__ 149467877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 149567877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1496b24902e0SBarry Smith { 1497a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1498dcd589f8SShri Abhyankar PetscErrorCode ierr; 149967877ebaSShri Abhyankar Vec b; 150067877ebaSShri Abhyankar IS is_iden; 150167877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1502397b6df1SKris Buschelman 1503397b6df1SKris Buschelman PetscFunctionBegin; 1504a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1505dcd589f8SShri Abhyankar 15069a2535b5SHong Zhang /* Set MUMPS options from the options database */ 15079a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1508dcd589f8SShri Abhyankar 1509a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1510dcd589f8SShri Abhyankar 151167877ebaSShri Abhyankar /* analysis phase */ 151267877ebaSShri Abhyankar /*----------------*/ 1513a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1514a5e57a09SHong Zhang mumps->id.n = M; 1515a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 151667877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1517a5e57a09SHong Zhang if (!mumps->myid) { 1518a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1519a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1520940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 152167877ebaSShri Abhyankar } 152267877ebaSShri Abhyankar } 152367877ebaSShri Abhyankar break; 152467877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1525a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1526a5e57a09SHong Zhang 
mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1527a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1528940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 152967877ebaSShri Abhyankar } 153067877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1531a5e57a09SHong Zhang if (!mumps->myid) { 1532a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 153367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 153467877ebaSShri Abhyankar } else { 1535a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 153667877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 153767877ebaSShri Abhyankar } 15382a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1539a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 15406bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 15416bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 154267877ebaSShri Abhyankar break; 154367877ebaSShri Abhyankar } 1544a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1545a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 154667877ebaSShri Abhyankar 15472792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1548dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 154951d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 15504e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 15514e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 15520298fd71SBarry Smith F->ops->getinertia = NULL; 15534e34a73bSHong Zhang #else 15544e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1555db4efbfdSBarry Smith #endif 1556b24902e0SBarry 
Smith PetscFunctionReturn(0); 1557b24902e0SBarry Smith } 1558b24902e0SBarry Smith 1559397b6df1SKris Buschelman #undef __FUNCT__ 156064e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 156164e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 156274ed9c26SBarry Smith { 1563f6c57405SHong Zhang PetscErrorCode ierr; 156464e6c443SBarry Smith PetscBool iascii; 156564e6c443SBarry Smith PetscViewerFormat format; 1566a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1567f6c57405SHong Zhang 1568f6c57405SHong Zhang PetscFunctionBegin; 156964e6c443SBarry Smith /* check if matrix is mumps type */ 157064e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 157164e6c443SBarry Smith 1572251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 157364e6c443SBarry Smith if (iascii) { 157464e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 157564e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 157664e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1577a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1578a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1579a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1580a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1581a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1582a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1583a5e57a09SHong Zhang ierr = 
PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1584a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1585a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1586a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1587a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1588a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1589a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1590a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1591a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1592a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1593a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1594a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1595a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1596f6c57405SHong Zhang } 1597a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1598a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): 
%d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1599a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1600f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1601a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1602a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1603a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1604ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (solution struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1605a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1606a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1607c0165424SHong Zhang 1608a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1609a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1610a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1611a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1612a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1613a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d 
\n",mumps->id.ICNTL(29));CHKERRQ(ierr); 161442179a6aSHong Zhang 1615a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1616a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1617a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1618f6c57405SHong Zhang 1619a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1620a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1621ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absolute pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1622ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (value of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1623a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1624f6c57405SHong Zhang 1625f6c57405SHong Zhang /* infomation local to each processor */ 162634ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 16277b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 1628a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 162934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 163034ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1631a5e57a09SHong Zhang ierr = 
PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 163234ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 163334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1634a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 163534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1636f6c57405SHong Zhang 163734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1638a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 163934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1640f6c57405SHong Zhang 164134ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1642a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 164334ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1644f6c57405SHong Zhang 164534ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1646a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 164734ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1648b34f08ffSHong Zhang 1649b34f08ffSHong Zhang if (mumps->ninfo && mumps->ninfo <= 40){ 1650b34f08ffSHong Zhang PetscInt i; 1651b34f08ffSHong Zhang for (i=0; i<mumps->ninfo; i++){ 1652b34f08ffSHong Zhang ierr = PetscViewerASCIIPrintf(viewer, " INFO(%d): \n",mumps->info[i]);CHKERRQ(ierr); 1653b34f08ffSHong Zhang ierr = 
PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(mumps->info[i]));CHKERRQ(ierr); 1654b34f08ffSHong Zhang ierr = PetscViewerFlush(viewer); 1655b34f08ffSHong Zhang } 1656b34f08ffSHong Zhang } 1657b34f08ffSHong Zhang 1658b34f08ffSHong Zhang 16597b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 1660f6c57405SHong Zhang 1661a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1662a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1663a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1664a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1665a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1666f6c57405SHong Zhang 1667a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1668a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1669a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1670a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1671a5e57a09SHong Zhang ierr = 
PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1672a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1673a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1674a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1675a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1676a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1677a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1678a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1679a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1680a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1681a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 
1682a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1683a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1684a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1685a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1686a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1687a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1688a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1689a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 169040d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 169140d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 169240d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," 
INFOG(30, 31) (after solution: size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 169340d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 169440d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 169540d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1696f6c57405SHong Zhang } 1697f6c57405SHong Zhang } 1698cb828f0fSHong Zhang } 1699f6c57405SHong Zhang PetscFunctionReturn(0); 1700f6c57405SHong Zhang } 1701f6c57405SHong Zhang 170235bd34faSBarry Smith #undef __FUNCT__ 170335bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 170435bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 170535bd34faSBarry Smith { 1706cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 170735bd34faSBarry Smith 170835bd34faSBarry Smith PetscFunctionBegin; 170935bd34faSBarry Smith info->block_size = 1.0; 1710cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1711cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 171235bd34faSBarry Smith info->nz_unneeded = 0.0; 171335bd34faSBarry Smith info->assemblies = 0.0; 171435bd34faSBarry Smith info->mallocs = 0.0; 171535bd34faSBarry Smith info->memory = 0.0; 171635bd34faSBarry Smith info->fill_ratio_given = 0; 171735bd34faSBarry Smith info->fill_ratio_needed = 0; 171835bd34faSBarry Smith info->factor_mallocs = 0; 171935bd34faSBarry Smith PetscFunctionReturn(0); 172035bd34faSBarry Smith } 172135bd34faSBarry Smith 17225ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 17235ccb76cbSHong Zhang #undef __FUNCT__ 17246444a565SStefano Zampini #define __FUNCT__ 
"MatMumpsSetSchurIndices_MUMPS" 17256444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices_MUMPS(Mat F,PetscInt size,PetscInt idxs[]) 17266444a565SStefano Zampini { 17276444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17286444a565SStefano Zampini PetscErrorCode ierr; 17296444a565SStefano Zampini 17306444a565SStefano Zampini PetscFunctionBegin; 173159ac8732SStefano Zampini if (mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MUMPS parallel Schur complements not yet supported from PETSc\n"); 17326444a565SStefano Zampini if (mumps->id.size_schur != size) { 17336444a565SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 17346444a565SStefano Zampini mumps->id.size_schur = size; 17356444a565SStefano Zampini mumps->id.schur_lld = size; 17366444a565SStefano Zampini ierr = PetscMalloc2(size,&mumps->id.listvar_schur,size*size,&mumps->id.schur);CHKERRQ(ierr); 17376444a565SStefano Zampini } 17386444a565SStefano Zampini ierr = PetscMemcpy(mumps->id.listvar_schur,idxs,size*sizeof(PetscInt));CHKERRQ(ierr); 17396444a565SStefano Zampini if (F->factortype == MAT_FACTOR_LU) { 174059ac8732SStefano Zampini mumps->id.ICNTL(19) = 3; /* MUMPS returns full matrix */ 17416444a565SStefano Zampini } else { 174259ac8732SStefano Zampini mumps->id.ICNTL(19) = 2; /* MUMPS returns lower triangular part */ 17436444a565SStefano Zampini } 174459ac8732SStefano Zampini /* set a special value of ICNTL (not handled my MUMPS) to be used in the solve phase by PETSc */ 1745b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 17466444a565SStefano Zampini PetscFunctionReturn(0); 17476444a565SStefano Zampini } 17486444a565SStefano Zampini 17496444a565SStefano Zampini #undef __FUNCT__ 17506444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices" 17516444a565SStefano Zampini /*@ 17526444a565SStefano Zampini MatMumpsSetSchurIndices - Set indices defining the Schur complement that MUMPS will compute during the factorization steps 
17536444a565SStefano Zampini 17546444a565SStefano Zampini Logically Collective on Mat 17556444a565SStefano Zampini 17566444a565SStefano Zampini Input Parameters: 17576444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 17586444a565SStefano Zampini . size - size of the Schur complement indices 17596444a565SStefano Zampini - idxs[] - array of Schur complement indices 17606444a565SStefano Zampini 17616444a565SStefano Zampini Notes: 176259ac8732SStefano Zampini The user has to free the array idxs[] since the indices are copied by the routine. 176359ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 17646444a565SStefano Zampini 17656444a565SStefano Zampini Level: advanced 17666444a565SStefano Zampini 17676444a565SStefano Zampini References: MUMPS Users' Guide 17686444a565SStefano Zampini 176959ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsCreateSchurComplement(), MatMumpsGetSchurComplement() 17706444a565SStefano Zampini @*/ 17716444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices(Mat F,PetscInt size,PetscInt idxs[]) 17726444a565SStefano Zampini { 17736444a565SStefano Zampini PetscErrorCode ierr; 17746444a565SStefano Zampini 17756444a565SStefano Zampini PetscFunctionBegin; 1776e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 1777e807eca7SStefano Zampini if (size) PetscValidIntPointer(idxs,3); 17786444a565SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsSetSchurIndices_C",(Mat,PetscInt,PetscInt[]),(F,size,idxs));CHKERRQ(ierr); 17796444a565SStefano Zampini PetscFunctionReturn(0); 17806444a565SStefano Zampini } 178159ac8732SStefano Zampini 17826444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 17836444a565SStefano Zampini #undef __FUNCT__ 178459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement_MUMPS" 178559ac8732SStefano Zampini 
/*
  MatMumpsCreateSchurComplement_MUMPS - Creates a new MATDENSE matrix and fills it with a full copy of the
  Schur data held in mumps->id.schur.

  Input Parameter:
. F - factor matrix whose spptr is read as a Mat_MUMPS

  Output Parameter:
. S - the newly created size_schur x size_schur dense matrix

  Notes:
  Errors out with PETSC_ERR_ORDER when the numerical factorization has not been performed, when ICNTL(19)
  is 0, when size_schur is 0, or when a previously obtained Schur matrix has not been restored.
  The raw data is unpacked according to mumps->sym and ICNTL(19):
    unsymmetric, ICNTL(19)==1      - full matrix stored by rows, transposed into the dense array
    unsymmetric, any other value   - full matrix stored by columns, copied as is
    symmetric,   ICNTL(19)==2      - lower triangle stored by columns, mirrored to both triangles
    symmetric,   ICNTL(19)==3      - full matrix, copied as is
    symmetric,   any other value   - lower triangle stored by rows, mirrored to both triangles
*/
PetscErrorCode MatMumpsCreateSchurComplement_MUMPS(Mat F,Mat* S)
{
  Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
  Mat            dense;
  PetscScalar    *array,val;
  PetscInt       outer,inner,first,last,N;
  PetscBool      rawcopy,mirror,bycols;
#if defined(PETSC_USE_COMPLEX)
  PetscScalar    im = PetscSqrtScalar((PetscScalar)-1.0);
#endif
  PetscErrorCode ierr;

  PetscFunctionBegin;
  /* preconditions, tested in the same order as before; each SETERRQ leaves the function */
  if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */
    SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before");
  }
  if (!mumps->id.ICNTL(19)) {
    SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it");
  }
  if (!mumps->id.size_schur) {
    SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before");
  }
  if (!mumps->schur_restored) {
    SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement");
  }

  ierr = MatCreate(PetscObjectComm((PetscObject)F),&dense);CHKERRQ(ierr);
  ierr = MatSetSizes(dense,PETSC_DECIDE,PETSC_DECIDE,mumps->id.size_schur,mumps->id.size_schur);CHKERRQ(ierr);
  ierr = MatSetType(dense,MATDENSE);CHKERRQ(ierr);
  ierr = MatSetUp(dense);CHKERRQ(ierr);
  ierr = MatDenseGetArray(dense,&array);CHKERRQ(ierr);

  /* classify the layout of the raw data */
  if (!mumps->sym) { /* MUMPS always return a full matrix */
    rawcopy = (mumps->id.ICNTL(19) == 1) ? PETSC_FALSE : PETSC_TRUE; /* 1: stored by rows, otherwise by columns */
    mirror  = PETSC_FALSE;
    bycols  = PETSC_FALSE;
  } else { /* either full or lower-triangular (not packed) */
    rawcopy = (mumps->id.ICNTL(19) == 3) ? PETSC_TRUE : PETSC_FALSE; /* 3: full matrix */
    mirror  = PETSC_TRUE;
    bycols  = (mumps->id.ICNTL(19) == 2) ? PETSC_TRUE : PETSC_FALSE; /* 2: lower triangle by columns, else by rows */
  }

  if (rawcopy) {
    ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr);
  } else {
    N = mumps->id.size_schur;
    for (outer=0; outer<N; outer++) {
      /* range of the inner index that holds stored entries for this outer index */
      if (!mirror) {
        first = 0;     last = N;
      } else if (bycols) {
        first = outer; last = N;
      } else {
        first = 0;     last = outer+1;
      }
      for (inner=first; inner<last; inner++) {
#if !defined(PETSC_USE_COMPLEX)
        val = mumps->id.schur[outer*N+inner];
#else
        val = mumps->id.schur[outer*N+inner].r + im*mumps->id.schur[outer*N+inner].i;
#endif
        /* triangular input fills both triangles; full-by-rows input is only transposed */
        if (mirror) array[outer*N+inner] = val;
        array[inner*N+outer] = val;
      }
    }
  }
  ierr = MatDenseRestoreArray(dense,&array);CHKERRQ(ierr);
  *S = dense;
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatMumpsCreateSchurComplement"
/*@ 186559ac8732SStefano Zampini MatMumpsCreateSchurComplement - Create a Schur complement matrix object using Schur data computed by MUMPS during the factorization step 18666444a565SStefano Zampini 18676444a565SStefano Zampini Logically Collective on Mat 18686444a565SStefano Zampini 18696444a565SStefano Zampini Input Parameters: 18706444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 18716444a565SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 18726444a565SStefano Zampini 18736444a565SStefano Zampini Notes: 187459ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 187559ac8732SStefano Zampini The routine provides a copy of the Schur data stored within MUMPS data strutures. The caller must destroy the object when it is no longer needed. 1876066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 18776444a565SStefano Zampini 18786444a565SStefano Zampini Level: advanced 18796444a565SStefano Zampini 18806444a565SStefano Zampini References: MUMPS Users' Guide 18816444a565SStefano Zampini 188259ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement() 188359ac8732SStefano Zampini @*/ 188459ac8732SStefano Zampini PetscErrorCode MatMumpsCreateSchurComplement(Mat F,Mat* S) 188559ac8732SStefano Zampini { 188659ac8732SStefano Zampini PetscErrorCode ierr; 188759ac8732SStefano Zampini 188859ac8732SStefano Zampini PetscFunctionBegin; 1889e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 189059ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsCreateSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 189159ac8732SStefano Zampini PetscFunctionReturn(0); 189259ac8732SStefano Zampini } 189359ac8732SStefano Zampini 189459ac8732SStefano Zampini /* 
-------------------------------------------------------------------------------------------*/ 189559ac8732SStefano Zampini #undef __FUNCT__ 189659ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement_MUMPS" 189759ac8732SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement_MUMPS(Mat F,Mat* S) 189859ac8732SStefano Zampini { 189959ac8732SStefano Zampini Mat St; 190059ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 190159ac8732SStefano Zampini PetscErrorCode ierr; 190259ac8732SStefano Zampini 190359ac8732SStefano Zampini PetscFunctionBegin; 190459ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 190559ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 190659ac8732SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 190759ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 190859ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 190959ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 191059ac8732SStefano Zampini } else if (!mumps->schur_restored) { 191159ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 191259ac8732SStefano Zampini } 191359ac8732SStefano Zampini /* It should be the responsibility of the user to handle different ICNTL(19) cases if they want to work with the raw data */ 191459ac8732SStefano Zampini /* should I also add errors when the Schur complement has been already factored? 
*/ 191559ac8732SStefano Zampini ierr = MatCreateSeqDense(PetscObjectComm((PetscObject)F),mumps->id.size_schur,mumps->id.size_schur,(PetscScalar*)mumps->id.schur,&St);CHKERRQ(ierr); 191659ac8732SStefano Zampini *S = St; 191759ac8732SStefano Zampini mumps->schur_restored = PETSC_FALSE; 191859ac8732SStefano Zampini PetscFunctionReturn(0); 191959ac8732SStefano Zampini } 192059ac8732SStefano Zampini 192159ac8732SStefano Zampini #undef __FUNCT__ 192259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement" 192359ac8732SStefano Zampini /*@ 192459ac8732SStefano Zampini MatMumpsGetSchurComplement - Get a Schur complement matrix object using the current status of the raw Schur data computed by MUMPS during the factorization step 192559ac8732SStefano Zampini 192659ac8732SStefano Zampini Logically Collective on Mat 192759ac8732SStefano Zampini 192859ac8732SStefano Zampini Input Parameters: 192959ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 193059ac8732SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 193159ac8732SStefano Zampini 193259ac8732SStefano Zampini Notes: 193359ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 193459ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. The caller should call MatMumpsRestoreSchurComplement when the object is no longer needed. 
1935066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 193659ac8732SStefano Zampini 193759ac8732SStefano Zampini Level: advanced 193859ac8732SStefano Zampini 193959ac8732SStefano Zampini References: MUMPS Users' Guide 194059ac8732SStefano Zampini 194159ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsRestoreSchurComplement(), MatMumpsCreateSchurComplement() 19426444a565SStefano Zampini @*/ 19436444a565SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement(Mat F,Mat* S) 19446444a565SStefano Zampini { 19456444a565SStefano Zampini PetscErrorCode ierr; 19466444a565SStefano Zampini 19476444a565SStefano Zampini PetscFunctionBegin; 1948e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 194959ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsGetSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 195059ac8732SStefano Zampini PetscFunctionReturn(0); 195159ac8732SStefano Zampini } 195259ac8732SStefano Zampini 195359ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 195459ac8732SStefano Zampini #undef __FUNCT__ 195559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement_MUMPS" 195659ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement_MUMPS(Mat F,Mat* S) 195759ac8732SStefano Zampini { 195859ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 195959ac8732SStefano Zampini PetscErrorCode ierr; 196059ac8732SStefano Zampini 196159ac8732SStefano Zampini PetscFunctionBegin; 196259ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 196359ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! 
You should call MatFactorSymbolic/Numeric before"); 196459ac8732SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 196559ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 196659ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 196759ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 1968066565c5SStefano Zampini } else if (mumps->schur_restored) { 1969066565c5SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has been already restored"); 197059ac8732SStefano Zampini } 197159ac8732SStefano Zampini ierr = MatDestroy(S);CHKERRQ(ierr); 197259ac8732SStefano Zampini *S = NULL; 197359ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 197459ac8732SStefano Zampini PetscFunctionReturn(0); 197559ac8732SStefano Zampini } 197659ac8732SStefano Zampini 197759ac8732SStefano Zampini #undef __FUNCT__ 197859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement" 197959ac8732SStefano Zampini /*@ 198059ac8732SStefano Zampini MatMumpsRestoreSchurComplement - Restore the Schur complement matrix object obtained from a call to MatGetSchurComplement 198159ac8732SStefano Zampini 198259ac8732SStefano Zampini Logically Collective on Mat 198359ac8732SStefano Zampini 198459ac8732SStefano Zampini Input Parameters: 198559ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 198659ac8732SStefano Zampini . *S - location where the Schur complement is stored 198759ac8732SStefano Zampini 198859ac8732SStefano Zampini Notes: 198959ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 
199059ac8732SStefano Zampini 199159ac8732SStefano Zampini Level: advanced 199259ac8732SStefano Zampini 199359ac8732SStefano Zampini References: MUMPS Users' Guide 199459ac8732SStefano Zampini 199559ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement(), MatMumpsCreateSchurComplement() 199659ac8732SStefano Zampini @*/ 199759ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement(Mat F,Mat* S) 199859ac8732SStefano Zampini { 199959ac8732SStefano Zampini PetscErrorCode ierr; 200059ac8732SStefano Zampini 200159ac8732SStefano Zampini PetscFunctionBegin; 2002e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 200359ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsRestoreSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 200459ac8732SStefano Zampini PetscFunctionReturn(0); 200559ac8732SStefano Zampini } 200659ac8732SStefano Zampini 200759ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 200859ac8732SStefano Zampini #undef __FUNCT__ 200959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement_MUMPS" 201059ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement_MUMPS(Mat F) 201159ac8732SStefano Zampini { 201259ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 201359ac8732SStefano Zampini PetscErrorCode ierr; 201459ac8732SStefano Zampini 201559ac8732SStefano Zampini PetscFunctionBegin; 201659ac8732SStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing */ 201759ac8732SStefano Zampini PetscFunctionReturn(0); 201859ac8732SStefano Zampini } 201959ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 202059ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! 
You should call MatFactorSymbolic/Numeric before"); 202159ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 202259ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 202359ac8732SStefano Zampini } else if (!mumps->schur_restored) { 202459ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 202559ac8732SStefano Zampini } 202659ac8732SStefano Zampini ierr = MatMumpsInvertSchur_Private(mumps);CHKERRQ(ierr); 202759ac8732SStefano Zampini PetscFunctionReturn(0); 202859ac8732SStefano Zampini } 202959ac8732SStefano Zampini 203059ac8732SStefano Zampini #undef __FUNCT__ 203159ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement" 203259ac8732SStefano Zampini /*@ 203359ac8732SStefano Zampini MatMumpsInvertSchurComplement - Invert the raw Schur data computed by MUMPS during the factorization step 203459ac8732SStefano Zampini 203559ac8732SStefano Zampini Logically Collective on Mat 203659ac8732SStefano Zampini 203759ac8732SStefano Zampini Input Parameters: 203859ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 203959ac8732SStefano Zampini 204059ac8732SStefano Zampini Notes: 204159ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 204259ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. 
204359ac8732SStefano Zampini 204459ac8732SStefano Zampini Level: advanced 204559ac8732SStefano Zampini 204659ac8732SStefano Zampini References: MUMPS Users' Guide 204759ac8732SStefano Zampini 204859ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 204959ac8732SStefano Zampini @*/ 205059ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement(Mat F) 205159ac8732SStefano Zampini { 205259ac8732SStefano Zampini PetscErrorCode ierr; 205359ac8732SStefano Zampini 205459ac8732SStefano Zampini PetscFunctionBegin; 2055e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 205659ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsInvertSchurComplement_C",(Mat),(F));CHKERRQ(ierr); 20576444a565SStefano Zampini PetscFunctionReturn(0); 20586444a565SStefano Zampini } 20596444a565SStefano Zampini 20606444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 20616444a565SStefano Zampini #undef __FUNCT__ 2062e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement_MUMPS" 2063e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement_MUMPS(Mat F, Vec rhs, Vec sol) 2064e807eca7SStefano Zampini { 2065e807eca7SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2066e807eca7SStefano Zampini MumpsScalar *orhs; 2067e807eca7SStefano Zampini PetscScalar *osol,*nrhs,*nsol; 20689a3a5937SStefano Zampini PetscInt orhs_size,osol_size,olrhs_size; 2069e807eca7SStefano Zampini PetscErrorCode ierr; 2070e807eca7SStefano Zampini 2071e807eca7SStefano Zampini PetscFunctionBegin; 2072e807eca7SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 2073e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! 
You should call MatFactorSymbolic/Numeric before"); 2074e807eca7SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 2075e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 2076e807eca7SStefano Zampini } else if (!mumps->id.size_schur) { 2077e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 2078e807eca7SStefano Zampini } else if (!mumps->schur_restored) { 2079e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 2080e807eca7SStefano Zampini } 2081e807eca7SStefano Zampini /* swap pointers */ 2082e807eca7SStefano Zampini orhs = mumps->id.redrhs; 20839a3a5937SStefano Zampini olrhs_size = mumps->id.lredrhs; 2084a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 2085e807eca7SStefano Zampini osol = mumps->schur_sol; 2086a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 2087e807eca7SStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 2088e807eca7SStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 2089e807eca7SStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2090a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 20919a3a5937SStefano Zampini mumps->id.lredrhs = mumps->sizeredrhs; 2092e807eca7SStefano Zampini mumps->schur_sol = nsol; 2093a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 2094a12f35bfSStefano Zampini 2095e807eca7SStefano Zampini /* solve Schur complement */ 2096e807eca7SStefano Zampini mumps->id.nrhs = 1; 2097e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 2098e807eca7SStefano Zampini /* restore pointers */ 2099e807eca7SStefano Zampini ierr = 
VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 2100e807eca7SStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 2101e807eca7SStefano Zampini mumps->id.redrhs = orhs; 21029a3a5937SStefano Zampini mumps->id.lredrhs = olrhs_size; 2103a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 2104e807eca7SStefano Zampini mumps->schur_sol = osol; 2105a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 2106e807eca7SStefano Zampini PetscFunctionReturn(0); 2107e807eca7SStefano Zampini } 2108e807eca7SStefano Zampini 2109e807eca7SStefano Zampini #undef __FUNCT__ 2110e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement" 2111e807eca7SStefano Zampini /*@ 2112e807eca7SStefano Zampini MatMumpsSolveSchurComplement - Solve the Schur complement system computed by MUMPS during the factorization step 2113e807eca7SStefano Zampini 2114e807eca7SStefano Zampini Logically Collective on Mat 2115e807eca7SStefano Zampini 2116e807eca7SStefano Zampini Input Parameters: 2117e807eca7SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2118e807eca7SStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 2119e807eca7SStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 2120e807eca7SStefano Zampini 2121e807eca7SStefano Zampini Notes: 2122e807eca7SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 
2123e807eca7SStefano Zampini The sizes of the vectors should match the size of the Schur complement 2124e807eca7SStefano Zampini 2125e807eca7SStefano Zampini Level: advanced 2126e807eca7SStefano Zampini 2127e807eca7SStefano Zampini References: MUMPS Users' Guide 2128e807eca7SStefano Zampini 2129e807eca7SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 2130e807eca7SStefano Zampini @*/ 2131e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement(Mat F, Vec rhs, Vec sol) 2132e807eca7SStefano Zampini { 2133e807eca7SStefano Zampini PetscErrorCode ierr; 2134e807eca7SStefano Zampini 2135e807eca7SStefano Zampini PetscFunctionBegin; 2136e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 2137e807eca7SStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 2138e807eca7SStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 2139e807eca7SStefano Zampini PetscCheckSameComm(F,1,rhs,2); 2140e807eca7SStefano Zampini PetscCheckSameComm(F,1,sol,3); 21417404bcfbSStefano Zampini ierr = PetscUseMethod(F,"MatMumpsSolveSchurComplement_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 21427404bcfbSStefano Zampini PetscFunctionReturn(0); 21437404bcfbSStefano Zampini } 21447404bcfbSStefano Zampini 21457404bcfbSStefano Zampini /* -------------------------------------------------------------------------------------------*/ 21467404bcfbSStefano Zampini #undef __FUNCT__ 21477404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose_MUMPS" 21487404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose_MUMPS(Mat F, Vec rhs, Vec sol) 21497404bcfbSStefano Zampini { 21507404bcfbSStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 21517404bcfbSStefano Zampini MumpsScalar *orhs; 21527404bcfbSStefano Zampini PetscScalar *osol,*nrhs,*nsol; 2153a12f35bfSStefano Zampini PetscInt orhs_size,osol_size; 21547404bcfbSStefano Zampini PetscErrorCode ierr; 21557404bcfbSStefano Zampini 21567404bcfbSStefano Zampini 
PetscFunctionBegin; 21577404bcfbSStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 21587404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 21597404bcfbSStefano Zampini } else if (!mumps->id.ICNTL(19)) { 21607404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 21617404bcfbSStefano Zampini } else if (!mumps->id.size_schur) { 21627404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 21637404bcfbSStefano Zampini } else if (!mumps->schur_restored) { 21647404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 21657404bcfbSStefano Zampini } 21667404bcfbSStefano Zampini /* swap pointers */ 21677404bcfbSStefano Zampini orhs = mumps->id.redrhs; 2168a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 21697404bcfbSStefano Zampini osol = mumps->schur_sol; 2170a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 21717404bcfbSStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 21727404bcfbSStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 21737404bcfbSStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2174a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 21757404bcfbSStefano Zampini mumps->schur_sol = nsol; 2176a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 2177a12f35bfSStefano Zampini 21787404bcfbSStefano Zampini /* solve Schur complement */ 21797404bcfbSStefano Zampini mumps->id.nrhs = 1; 21807404bcfbSStefano Zampini mumps->id.ICNTL(9) = 0; 21817404bcfbSStefano 
Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 21827404bcfbSStefano Zampini mumps->id.ICNTL(9) = 1; 21837404bcfbSStefano Zampini /* restore pointers */ 21847404bcfbSStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 21857404bcfbSStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 21867404bcfbSStefano Zampini mumps->id.redrhs = orhs; 2187a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 21887404bcfbSStefano Zampini mumps->schur_sol = osol; 2189a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 21907404bcfbSStefano Zampini PetscFunctionReturn(0); 21917404bcfbSStefano Zampini } 21927404bcfbSStefano Zampini 21937404bcfbSStefano Zampini #undef __FUNCT__ 2194*a0b0af32SStefano Zampini #define __FUNCT__ "MatMumpsSchurComplementSetSym" 2195*a0b0af32SStefano Zampini /*@ 2196*a0b0af32SStefano Zampini MatMumpsSchurComplementSetSym - Set symmetric info for Schur complement 2197*a0b0af32SStefano Zampini 2198*a0b0af32SStefano Zampini Logically Collective on Mat 2199*a0b0af32SStefano Zampini 2200*a0b0af32SStefano Zampini Input Parameters: 2201*a0b0af32SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2202*a0b0af32SStefano Zampini - sym - either 0 (non-symmetric), 1 (symmetric positive definite) or 2 (symmetric indefinite) following MUMPS convention 2203*a0b0af32SStefano Zampini 2204*a0b0af32SStefano Zampini Notes: 2205*a0b0af32SStefano Zampini The parameter is used to compute the correct factorization of the Schur complement matrices 2206*a0b0af32SStefano Zampini This could be useful in case the nature of the Schur complement is different from that of the matrix to be factored 2207*a0b0af32SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 
2208*a0b0af32SStefano Zampini 2209*a0b0af32SStefano Zampini Level: advanced 2210*a0b0af32SStefano Zampini 2211*a0b0af32SStefano Zampini References: MUMPS Users' Guide 2212*a0b0af32SStefano Zampini 2213*a0b0af32SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 2214*a0b0af32SStefano Zampini @*/ 2215*a0b0af32SStefano Zampini PetscErrorCode MatMumpsSchurComplementSetSym(Mat F, PetscInt sym) 2216*a0b0af32SStefano Zampini { 2217*a0b0af32SStefano Zampini PetscErrorCode ierr; 2218*a0b0af32SStefano Zampini 2219*a0b0af32SStefano Zampini PetscFunctionBegin; 2220*a0b0af32SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 2221*a0b0af32SStefano Zampini PetscValidLogicalCollectiveInt(F,sym,2); 2222*a0b0af32SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsSchurComplementSetSym_C",(Mat,PetscInt),(F,sym));CHKERRQ(ierr); 2223*a0b0af32SStefano Zampini PetscFunctionReturn(0); 2224*a0b0af32SStefano Zampini } 2225*a0b0af32SStefano Zampini 2226*a0b0af32SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 2227*a0b0af32SStefano Zampini #undef __FUNCT__ 2228*a0b0af32SStefano Zampini #define __FUNCT__ "MatMumpsSchurComplementSetSym_MUMPS" 2229*a0b0af32SStefano Zampini PetscErrorCode MatMumpsSchurComplementSetSym_MUMPS(Mat F, PetscInt sym) 2230*a0b0af32SStefano Zampini { 2231*a0b0af32SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2232*a0b0af32SStefano Zampini 2233*a0b0af32SStefano Zampini PetscFunctionBegin; 2234*a0b0af32SStefano Zampini if (mumps->schur_factored && mumps->sym != mumps->schur_sym) { 2235*a0b0af32SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_WRONG,"Schur complement data has been already factored"); 2236*a0b0af32SStefano Zampini } 2237*a0b0af32SStefano Zampini mumps->schur_sym = sym; 2238*a0b0af32SStefano Zampini PetscFunctionReturn(0); 2239*a0b0af32SStefano Zampini } 2240*a0b0af32SStefano Zampini 2241*a0b0af32SStefano Zampini #undef __FUNCT__ 
22427404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose" 22437404bcfbSStefano Zampini /*@ 22447404bcfbSStefano Zampini MatMumpsSolveSchurComplementTranspose - Solve the transpose of the Schur complement system computed by MUMPS during the factorization step 22457404bcfbSStefano Zampini 22467404bcfbSStefano Zampini Logically Collective on Mat 22477404bcfbSStefano Zampini 22487404bcfbSStefano Zampini Input Parameters: 22497404bcfbSStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 22507404bcfbSStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 22517404bcfbSStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 22527404bcfbSStefano Zampini 22537404bcfbSStefano Zampini Notes: 22547404bcfbSStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 22557404bcfbSStefano Zampini The sizes of the vectors should match the size of the Schur complement 22567404bcfbSStefano Zampini 22577404bcfbSStefano Zampini Level: advanced 22587404bcfbSStefano Zampini 22597404bcfbSStefano Zampini References: MUMPS Users' Guide 22607404bcfbSStefano Zampini 22617404bcfbSStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 22627404bcfbSStefano Zampini @*/ 22637404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose(Mat F, Vec rhs, Vec sol) 22647404bcfbSStefano Zampini { 22657404bcfbSStefano Zampini PetscErrorCode ierr; 22667404bcfbSStefano Zampini 22677404bcfbSStefano Zampini PetscFunctionBegin; 22687404bcfbSStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 22697404bcfbSStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 22707404bcfbSStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 22717404bcfbSStefano Zampini PetscCheckSameComm(F,1,rhs,2); 22727404bcfbSStefano Zampini PetscCheckSameComm(F,1,sol,3); 22737404bcfbSStefano 
Zampini ierr = PetscUseMethod(F,"MatMumpsSolveSchurComplementTranspose_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 2274e807eca7SStefano Zampini PetscFunctionReturn(0); 2275e807eca7SStefano Zampini } 2276e807eca7SStefano Zampini 2277e807eca7SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 2278e807eca7SStefano Zampini #undef __FUNCT__ 22795ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 22805ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 22815ccb76cbSHong Zhang { 2282a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 22835ccb76cbSHong Zhang 22845ccb76cbSHong Zhang PetscFunctionBegin; 2285a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 22865ccb76cbSHong Zhang PetscFunctionReturn(0); 22875ccb76cbSHong Zhang } 22885ccb76cbSHong Zhang 22895ccb76cbSHong Zhang #undef __FUNCT__ 2290bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 2291bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 2292bc6112feSHong Zhang { 2293bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2294bc6112feSHong Zhang 2295bc6112feSHong Zhang PetscFunctionBegin; 2296bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 2297bc6112feSHong Zhang PetscFunctionReturn(0); 2298bc6112feSHong Zhang } 2299bc6112feSHong Zhang 2300bc6112feSHong Zhang #undef __FUNCT__ 23015ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 23025ccb76cbSHong Zhang /*@ 23035ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 23045ccb76cbSHong Zhang 23055ccb76cbSHong Zhang Logically Collective on Mat 23065ccb76cbSHong Zhang 23075ccb76cbSHong Zhang Input Parameters: 23085ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 23095ccb76cbSHong Zhang . 
icntl - index of MUMPS parameter array ICNTL() 23105ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 23115ccb76cbSHong Zhang 23125ccb76cbSHong Zhang Options Database: 23135ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 23145ccb76cbSHong Zhang 23155ccb76cbSHong Zhang Level: beginner 23165ccb76cbSHong Zhang 23175ccb76cbSHong Zhang References: MUMPS Users' Guide 23185ccb76cbSHong Zhang 23195ccb76cbSHong Zhang .seealso: MatGetFactor() 23205ccb76cbSHong Zhang @*/ 23215ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 23225ccb76cbSHong Zhang { 23235ccb76cbSHong Zhang PetscErrorCode ierr; 23245ccb76cbSHong Zhang 23255ccb76cbSHong Zhang PetscFunctionBegin; 23265ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 23275ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 23285ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 23295ccb76cbSHong Zhang PetscFunctionReturn(0); 23305ccb76cbSHong Zhang } 23315ccb76cbSHong Zhang 2332bc6112feSHong Zhang #undef __FUNCT__ 2333bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 2334a21f80fcSHong Zhang /*@ 2335a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS parameter ICNTL() 2336a21f80fcSHong Zhang 2337a21f80fcSHong Zhang Logically Collective on Mat 2338a21f80fcSHong Zhang 2339a21f80fcSHong Zhang Input Parameters: 2340a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2341a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 2342a21f80fcSHong Zhang 2343a21f80fcSHong Zhang Output Parameter: 2344a21f80fcSHong Zhang . 
ival - value of MUMPS ICNTL(icntl) 2345a21f80fcSHong Zhang 2346a21f80fcSHong Zhang Level: beginner 2347a21f80fcSHong Zhang 2348a21f80fcSHong Zhang References: MUMPS Users' Guide 2349a21f80fcSHong Zhang 2350a21f80fcSHong Zhang .seealso: MatGetFactor() 2351a21f80fcSHong Zhang @*/ 2352bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 2353bc6112feSHong Zhang { 2354bc6112feSHong Zhang PetscErrorCode ierr; 2355bc6112feSHong Zhang 2356bc6112feSHong Zhang PetscFunctionBegin; 2357bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2358bc6112feSHong Zhang PetscValidIntPointer(ival,3); 2359bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2360bc6112feSHong Zhang PetscFunctionReturn(0); 2361bc6112feSHong Zhang } 2362bc6112feSHong Zhang 23638928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 23648928b65cSHong Zhang #undef __FUNCT__ 23658928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 23668928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 23678928b65cSHong Zhang { 23688928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 23698928b65cSHong Zhang 23708928b65cSHong Zhang PetscFunctionBegin; 23718928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 23728928b65cSHong Zhang PetscFunctionReturn(0); 23738928b65cSHong Zhang } 23748928b65cSHong Zhang 23758928b65cSHong Zhang #undef __FUNCT__ 2376bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl_MUMPS" 2377bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 2378bc6112feSHong Zhang { 2379bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2380bc6112feSHong Zhang 2381bc6112feSHong Zhang PetscFunctionBegin; 2382bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 2383bc6112feSHong Zhang PetscFunctionReturn(0); 2384bc6112feSHong Zhang } 2385bc6112feSHong 
Zhang 2386bc6112feSHong Zhang #undef __FUNCT__ 23878928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 23888928b65cSHong Zhang /*@ 23898928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 23908928b65cSHong Zhang 23918928b65cSHong Zhang Logically Collective on Mat 23928928b65cSHong Zhang 23938928b65cSHong Zhang Input Parameters: 23948928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 23958928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 23968928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 23978928b65cSHong Zhang 23988928b65cSHong Zhang Options Database: 23998928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 24008928b65cSHong Zhang 24018928b65cSHong Zhang Level: beginner 24028928b65cSHong Zhang 24038928b65cSHong Zhang References: MUMPS Users' Guide 24048928b65cSHong Zhang 24058928b65cSHong Zhang .seealso: MatGetFactor() 24068928b65cSHong Zhang @*/ 24078928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 24088928b65cSHong Zhang { 24098928b65cSHong Zhang PetscErrorCode ierr; 24108928b65cSHong Zhang 24118928b65cSHong Zhang PetscFunctionBegin; 24128928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2413bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 24148928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 24158928b65cSHong Zhang PetscFunctionReturn(0); 24168928b65cSHong Zhang } 24178928b65cSHong Zhang 2418bc6112feSHong Zhang #undef __FUNCT__ 2419bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 2420a21f80fcSHong Zhang /*@ 2421a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 2422a21f80fcSHong Zhang 2423a21f80fcSHong Zhang Logically Collective on Mat 2424a21f80fcSHong Zhang 2425a21f80fcSHong Zhang Input Parameters: 2426a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 
2427a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 2428a21f80fcSHong Zhang 2429a21f80fcSHong Zhang Output Parameter: 2430a21f80fcSHong Zhang . val - value of MUMPS CNTL(icntl) 2431a21f80fcSHong Zhang 2432a21f80fcSHong Zhang Level: beginner 2433a21f80fcSHong Zhang 2434a21f80fcSHong Zhang References: MUMPS Users' Guide 2435a21f80fcSHong Zhang 2436a21f80fcSHong Zhang .seealso: MatGetFactor() 2437a21f80fcSHong Zhang @*/ 2438bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 2439bc6112feSHong Zhang { 2440bc6112feSHong Zhang PetscErrorCode ierr; 2441bc6112feSHong Zhang 2442bc6112feSHong Zhang PetscFunctionBegin; 2443bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2444bc6112feSHong Zhang PetscValidRealPointer(val,3); 2445bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2446bc6112feSHong Zhang PetscFunctionReturn(0); 2447bc6112feSHong Zhang } 2448bc6112feSHong Zhang 2449bc6112feSHong Zhang #undef __FUNCT__ 2450ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 2451ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 2452bc6112feSHong Zhang { 2453bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2454bc6112feSHong Zhang 2455bc6112feSHong Zhang PetscFunctionBegin; 2456bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 2457bc6112feSHong Zhang PetscFunctionReturn(0); 2458bc6112feSHong Zhang } 2459bc6112feSHong Zhang 2460bc6112feSHong Zhang #undef __FUNCT__ 2461ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 2462ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 2463bc6112feSHong Zhang { 2464bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2465bc6112feSHong Zhang 2466bc6112feSHong Zhang PetscFunctionBegin; 2467bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 2468bc6112feSHong Zhang 
PetscFunctionReturn(0); 2469bc6112feSHong Zhang } 2470bc6112feSHong Zhang 2471bc6112feSHong Zhang #undef __FUNCT__ 2472ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo_MUMPS" 2473ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 2474bc6112feSHong Zhang { 2475bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2476bc6112feSHong Zhang 2477bc6112feSHong Zhang PetscFunctionBegin; 2478bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 2479bc6112feSHong Zhang PetscFunctionReturn(0); 2480bc6112feSHong Zhang } 2481bc6112feSHong Zhang 2482bc6112feSHong Zhang #undef __FUNCT__ 2483ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 2484ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 2485bc6112feSHong Zhang { 2486bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2487bc6112feSHong Zhang 2488bc6112feSHong Zhang PetscFunctionBegin; 2489bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 2490bc6112feSHong Zhang PetscFunctionReturn(0); 2491bc6112feSHong Zhang } 2492bc6112feSHong Zhang 2493bc6112feSHong Zhang #undef __FUNCT__ 2494ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 2495a21f80fcSHong Zhang /*@ 2496a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 2497a21f80fcSHong Zhang 2498a21f80fcSHong Zhang Logically Collective on Mat 2499a21f80fcSHong Zhang 2500a21f80fcSHong Zhang Input Parameters: 2501a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2502a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 2503a21f80fcSHong Zhang 2504a21f80fcSHong Zhang Output Parameter: 2505a21f80fcSHong Zhang . 
ival - value of MUMPS INFO(icntl) 2506a21f80fcSHong Zhang 2507a21f80fcSHong Zhang Level: beginner 2508a21f80fcSHong Zhang 2509a21f80fcSHong Zhang References: MUMPS Users' Guide 2510a21f80fcSHong Zhang 2511a21f80fcSHong Zhang .seealso: MatGetFactor() 2512a21f80fcSHong Zhang @*/ 2513ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 2514bc6112feSHong Zhang { 2515bc6112feSHong Zhang PetscErrorCode ierr; 2516bc6112feSHong Zhang 2517bc6112feSHong Zhang PetscFunctionBegin; 2518ca810319SHong Zhang PetscValidIntPointer(ival,3); 2519ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2520bc6112feSHong Zhang PetscFunctionReturn(0); 2521bc6112feSHong Zhang } 2522bc6112feSHong Zhang 2523bc6112feSHong Zhang #undef __FUNCT__ 2524ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 2525a21f80fcSHong Zhang /*@ 2526a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 2527a21f80fcSHong Zhang 2528a21f80fcSHong Zhang Logically Collective on Mat 2529a21f80fcSHong Zhang 2530a21f80fcSHong Zhang Input Parameters: 2531a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2532a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 2533a21f80fcSHong Zhang 2534a21f80fcSHong Zhang Output Parameter: 2535a21f80fcSHong Zhang . 
ival - value of MUMPS INFOG(icntl) 2536a21f80fcSHong Zhang 2537a21f80fcSHong Zhang Level: beginner 2538a21f80fcSHong Zhang 2539a21f80fcSHong Zhang References: MUMPS Users' Guide 2540a21f80fcSHong Zhang 2541a21f80fcSHong Zhang .seealso: MatGetFactor() 2542a21f80fcSHong Zhang @*/ 2543ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 2544bc6112feSHong Zhang { 2545bc6112feSHong Zhang PetscErrorCode ierr; 2546bc6112feSHong Zhang 2547bc6112feSHong Zhang PetscFunctionBegin; 2548ca810319SHong Zhang PetscValidIntPointer(ival,3); 2549ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2550bc6112feSHong Zhang PetscFunctionReturn(0); 2551bc6112feSHong Zhang } 2552bc6112feSHong Zhang 2553bc6112feSHong Zhang #undef __FUNCT__ 2554ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 2555a21f80fcSHong Zhang /*@ 2556a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 2557a21f80fcSHong Zhang 2558a21f80fcSHong Zhang Logically Collective on Mat 2559a21f80fcSHong Zhang 2560a21f80fcSHong Zhang Input Parameters: 2561a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2562a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 2563a21f80fcSHong Zhang 2564a21f80fcSHong Zhang Output Parameter: 2565a21f80fcSHong Zhang . 
val - value of MUMPS RINFO(icntl) 2566a21f80fcSHong Zhang 2567a21f80fcSHong Zhang Level: beginner 2568a21f80fcSHong Zhang 2569a21f80fcSHong Zhang References: MUMPS Users' Guide 2570a21f80fcSHong Zhang 2571a21f80fcSHong Zhang .seealso: MatGetFactor() 2572a21f80fcSHong Zhang @*/ 2573ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 2574bc6112feSHong Zhang { 2575bc6112feSHong Zhang PetscErrorCode ierr; 2576bc6112feSHong Zhang 2577bc6112feSHong Zhang PetscFunctionBegin; 2578bc6112feSHong Zhang PetscValidRealPointer(val,3); 2579ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2580bc6112feSHong Zhang PetscFunctionReturn(0); 2581bc6112feSHong Zhang } 2582bc6112feSHong Zhang 2583bc6112feSHong Zhang #undef __FUNCT__ 2584ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 2585a21f80fcSHong Zhang /*@ 2586a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 2587a21f80fcSHong Zhang 2588a21f80fcSHong Zhang Logically Collective on Mat 2589a21f80fcSHong Zhang 2590a21f80fcSHong Zhang Input Parameters: 2591a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2592a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 2593a21f80fcSHong Zhang 2594a21f80fcSHong Zhang Output Parameter: 2595a21f80fcSHong Zhang . 
val - value of MUMPS RINFOG(icntl) 2596a21f80fcSHong Zhang 2597a21f80fcSHong Zhang Level: beginner 2598a21f80fcSHong Zhang 2599a21f80fcSHong Zhang References: MUMPS Users' Guide 2600a21f80fcSHong Zhang 2601a21f80fcSHong Zhang .seealso: MatGetFactor() 2602a21f80fcSHong Zhang @*/ 2603ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 2604bc6112feSHong Zhang { 2605bc6112feSHong Zhang PetscErrorCode ierr; 2606bc6112feSHong Zhang 2607bc6112feSHong Zhang PetscFunctionBegin; 2608bc6112feSHong Zhang PetscValidRealPointer(val,3); 2609ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2610bc6112feSHong Zhang PetscFunctionReturn(0); 2611bc6112feSHong Zhang } 2612bc6112feSHong Zhang 261324b6179bSKris Buschelman /*MC 26142692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 261524b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 261624b6179bSKris Buschelman 261741c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 261824b6179bSKris Buschelman 2619c2b89b5dSBarry Smith Use ./configure --download-mumps --download-scalapack --download-parmetis --download-metis --download-ptscotch to have PETSc installed with MUMPS 2620c2b89b5dSBarry Smith 2621c2b89b5dSBarry Smith Use -pc_type cholesky or lu -pc_factor_mat_solver_package mumps to us this direct solver 2622c2b89b5dSBarry Smith 262324b6179bSKris Buschelman Options Database Keys: 26244e34a73bSHong Zhang + -mat_mumps_icntl_1 <6>: ICNTL(1): output stream for error messages (None) 26254e34a73bSHong Zhang . -mat_mumps_icntl_2 <0>: ICNTL(2): output stream for diagnostic printing, statistics, and warning (None) 26264e34a73bSHong Zhang . -mat_mumps_icntl_3 <0>: ICNTL(3): output stream for global information, collected on the host (None) 26274e34a73bSHong Zhang . 
-mat_mumps_icntl_4 <0>: ICNTL(4): level of printing (0 to 4) (None) 26284e34a73bSHong Zhang . -mat_mumps_icntl_6 <7>: ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) (None) 26294e34a73bSHong Zhang . -mat_mumps_icntl_7 <7>: ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis (None) 26304e34a73bSHong Zhang . -mat_mumps_icntl_8 <77>: ICNTL(8): scaling strategy (-2 to 8 or 77) (None) 26314e34a73bSHong Zhang . -mat_mumps_icntl_10 <0>: ICNTL(10): max num of refinements (None) 26324e34a73bSHong Zhang . -mat_mumps_icntl_11 <0>: ICNTL(11): statistics related to an error analysis (via -ksp_view) (None) 26334e34a73bSHong Zhang . -mat_mumps_icntl_12 <1>: ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) (None) 26344e34a73bSHong Zhang . -mat_mumps_icntl_13 <0>: ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting (None) 26354e34a73bSHong Zhang . -mat_mumps_icntl_14 <20>: ICNTL(14): percentage increase in the estimated working space (None) 26364e34a73bSHong Zhang . -mat_mumps_icntl_19 <0>: ICNTL(19): computes the Schur complement (None) 26374e34a73bSHong Zhang . -mat_mumps_icntl_22 <0>: ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) (None) 26384e34a73bSHong Zhang . -mat_mumps_icntl_23 <0>: ICNTL(23): max size of the working memory (MB) that can allocate per processor (None) 26394e34a73bSHong Zhang . -mat_mumps_icntl_24 <0>: ICNTL(24): detection of null pivot rows (0 or 1) (None) 26404e34a73bSHong Zhang . -mat_mumps_icntl_25 <0>: ICNTL(25): compute a solution of a deficient matrix and a null space basis (None) 26414e34a73bSHong Zhang . -mat_mumps_icntl_26 <0>: ICNTL(26): drives the solution phase if a Schur complement matrix (None) 26424e34a73bSHong Zhang . -mat_mumps_icntl_28 <1>: ICNTL(28): use 1 for sequential analysis and ICNTL(7) ordering, or 2 for parallel analysis and ICNTL(29) ordering (None) 26434e34a73bSHong Zhang .
-mat_mumps_icntl_29 <0>: ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis (None) 26444e34a73bSHong Zhang . -mat_mumps_icntl_30 <0>: ICNTL(30): compute user-specified set of entries in inv(A) (None) 26454e34a73bSHong Zhang . -mat_mumps_icntl_31 <0>: ICNTL(31): indicates which factors may be discarded during factorization (None) 26464e34a73bSHong Zhang . -mat_mumps_icntl_33 <0>: ICNTL(33): compute determinant (None) 26474e34a73bSHong Zhang . -mat_mumps_cntl_1 <0.01>: CNTL(1): relative pivoting threshold (None) 26484e34a73bSHong Zhang . -mat_mumps_cntl_2 <1.49012e-08>: CNTL(2): stopping criterion of refinement (None) 26494e34a73bSHong Zhang . -mat_mumps_cntl_3 <0>: CNTL(3): absolute pivoting threshold (None) 26504e34a73bSHong Zhang . -mat_mumps_cntl_4 <-1>: CNTL(4): value for static pivoting (None) 26514e34a73bSHong Zhang - -mat_mumps_cntl_5 <0>: CNTL(5): fixation for null pivots (None) 265224b6179bSKris Buschelman 265324b6179bSKris Buschelman Level: beginner 265424b6179bSKris Buschelman 265541c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 265641c8de11SBarry Smith 265724b6179bSKris Buschelman M*/ 265824b6179bSKris Buschelman 265935bd34faSBarry Smith #undef __FUNCT__ 266035bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 2661f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 266235bd34faSBarry Smith { 266335bd34faSBarry Smith PetscFunctionBegin; 26642692d6eeSBarry Smith *type = MATSOLVERMUMPS; 266535bd34faSBarry Smith PetscFunctionReturn(0); 266635bd34faSBarry Smith } 266735bd34faSBarry Smith 2668bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 26692877fffaSHong Zhang #undef __FUNCT__ 2670bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 26718cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 26722877fffaSHong Zhang { 26732877fffaSHong Zhang Mat B; 
26742877fffaSHong Zhang PetscErrorCode ierr; 26752877fffaSHong Zhang Mat_MUMPS *mumps; 2676ace3abfcSBarry Smith PetscBool isSeqAIJ; 26772877fffaSHong Zhang 26782877fffaSHong Zhang PetscFunctionBegin; 26792877fffaSHong Zhang /* Create the factorization matrix */ 2680251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 2681ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 26822877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 26832877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2684bccb9932SShri Abhyankar if (isSeqAIJ) { 26850298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 2686bccb9932SShri Abhyankar } else { 26870298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 2688bccb9932SShri Abhyankar } 26892877fffaSHong Zhang 2690b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 26912205254eSKarl Rupp 26922877fffaSHong Zhang B->ops->view = MatView_MUMPS; 269335bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 269420be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 26952205254eSKarl Rupp 2696bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2697bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2698bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2699bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2700bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2701bc6112feSHong Zhang 2702ca810319SHong Zhang ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2703ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2704ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2705ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 27066444a565SStefano Zampini 27076444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 270859ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 270959ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27106444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 271159ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2712e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 27137404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2714*a0b0af32SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSchurComplementSetSym_C",MatMumpsSchurComplementSetSym_MUMPS);CHKERRQ(ierr); 2715e807eca7SStefano Zampini 2716450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2717450b117fSShri Abhyankar B->ops->lufactorsymbolic = 
MatLUFactorSymbolic_AIJMUMPS; 2718d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 2719bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 2720bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 2721746480a1SHong Zhang mumps->sym = 0; 2722dcd589f8SShri Abhyankar } else { 272367877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2724450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 2725bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 2726bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 272759ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 272859ac8732SStefano Zampini mumps->sym = 2; 272959ac8732SStefano Zampini #else 27306fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 27316fdc2a6dSBarry Smith else mumps->sym = 2; 273259ac8732SStefano Zampini #endif 2733450b117fSShri Abhyankar } 27342877fffaSHong Zhang 27352877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 2736bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 27372877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 27382877fffaSHong Zhang B->spptr = (void*)mumps; 27392205254eSKarl Rupp 2740f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2741746480a1SHong Zhang 27422877fffaSHong Zhang *F = B; 27432877fffaSHong Zhang PetscFunctionReturn(0); 27442877fffaSHong Zhang } 27452877fffaSHong Zhang 2746bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 27472877fffaSHong Zhang #undef __FUNCT__ 2748bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 27498cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 27502877fffaSHong Zhang { 27512877fffaSHong Zhang Mat B; 27522877fffaSHong Zhang PetscErrorCode ierr; 27532877fffaSHong Zhang Mat_MUMPS *mumps; 
2754ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 27552877fffaSHong Zhang 27562877fffaSHong Zhang PetscFunctionBegin; 2757ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 2758ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 2759251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 27602877fffaSHong Zhang /* Create the factorization matrix */ 2761ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 27622877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 27632877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2764b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2765bccb9932SShri Abhyankar if (isSeqSBAIJ) { 27660298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 27672205254eSKarl Rupp 276816ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 2769dcd589f8SShri Abhyankar } else { 27700298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 27712205254eSKarl Rupp 2772bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 2773bccb9932SShri Abhyankar } 2774bccb9932SShri Abhyankar 277567877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2776bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 277720be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 27782205254eSKarl Rupp 2779bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2780b13644aeSHong Zhang ierr 
= PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2781b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2782b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2783b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2784bc6112feSHong Zhang 2785ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2786ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2787ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2788ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 27892205254eSKarl Rupp 27906444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 279159ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 279259ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27936444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 279459ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2795e807eca7SStefano Zampini ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 27967404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2797*a0b0af32SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSchurComplementSetSym_C",MatMumpsSchurComplementSetSym_MUMPS);CHKERRQ(ierr); 27986444a565SStefano Zampini 2799f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 280059ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 280159ac8732SStefano Zampini mumps->sym = 2; 280259ac8732SStefano Zampini #else 28036fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 28046fdc2a6dSBarry Smith else mumps->sym = 2; 280559ac8732SStefano Zampini #endif 2806a214ac2aSShri Abhyankar 2807bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 2808bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2809f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 28102877fffaSHong Zhang B->spptr = (void*)mumps; 28112205254eSKarl Rupp 2812f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2813746480a1SHong Zhang 28142877fffaSHong Zhang *F = B; 28152877fffaSHong Zhang PetscFunctionReturn(0); 28162877fffaSHong Zhang } 281797969023SHong Zhang 2818450b117fSShri Abhyankar #undef __FUNCT__ 2819bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 28208cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 282167877ebaSShri Abhyankar { 282267877ebaSShri Abhyankar Mat B; 282367877ebaSShri Abhyankar PetscErrorCode ierr; 282467877ebaSShri Abhyankar Mat_MUMPS *mumps; 2825ace3abfcSBarry Smith PetscBool isSeqBAIJ; 282667877ebaSShri Abhyankar 282767877ebaSShri Abhyankar PetscFunctionBegin; 282867877ebaSShri Abhyankar /* Create the factorization matrix */ 2829251f4c67SDmitry Karpeev ierr = 
PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 2830ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 283167877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 283267877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2833bccb9932SShri Abhyankar if (isSeqBAIJ) { 28340298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 2835bccb9932SShri Abhyankar } else { 28360298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 2837bccb9932SShri Abhyankar } 2838450b117fSShri Abhyankar 2839b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2840450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2841450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 2842450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 2843bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 2844bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 2845746480a1SHong Zhang mumps->sym = 0; 2846f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 2847bccb9932SShri Abhyankar 2848450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 284920be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 28502205254eSKarl Rupp 2851bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2852bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2853bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2854bdf89e91SBarry Smith 
ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2855bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2856bc6112feSHong Zhang 2857ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2858ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2859ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2860ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2861450b117fSShri Abhyankar 28626444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 286359ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 286459ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 28656444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 286659ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2867e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 28687404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2869*a0b0af32SStefano Zampini 
ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSchurComplementSetSym_C",MatMumpsSchurComplementSetSym_MUMPS);CHKERRQ(ierr); 28706444a565SStefano Zampini 2871450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2872bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2873450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2874450b117fSShri Abhyankar B->spptr = (void*)mumps; 28752205254eSKarl Rupp 2876f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2877746480a1SHong Zhang 2878450b117fSShri Abhyankar *F = B; 2879450b117fSShri Abhyankar PetscFunctionReturn(0); 2880450b117fSShri Abhyankar } 288142c9c57cSBarry Smith 288242c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 288342c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat,MatFactorType,Mat*); 288442c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat,MatFactorType,Mat*); 288542c9c57cSBarry Smith 288642c9c57cSBarry Smith #undef __FUNCT__ 288742c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 288829b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 288942c9c57cSBarry Smith { 289042c9c57cSBarry Smith PetscErrorCode ierr; 289142c9c57cSBarry Smith 289242c9c57cSBarry Smith PetscFunctionBegin; 289342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 289442c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 289542c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 289642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 289742c9c57cSBarry Smith ierr = 
MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 289842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 289942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 290042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 290142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 290242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 290342c9c57cSBarry Smith PetscFunctionReturn(0); 290442c9c57cSBarry Smith } 290542c9c57cSBarry Smith 2906