11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8b5fa320bSStefano Zampini #include <petscblaslapack.h> 9397b6df1SKris Buschelman 10397b6df1SKris Buschelman EXTERN_C_BEGIN 11397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 122907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 132907cef9SHong Zhang #include <cmumps_c.h> 142907cef9SHong Zhang #else 15c6db04a5SJed Brown #include <zmumps_c.h> 162907cef9SHong Zhang #endif 172907cef9SHong Zhang #else 182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 192907cef9SHong Zhang #include <smumps_c.h> 20397b6df1SKris Buschelman #else 21c6db04a5SJed Brown #include <dmumps_c.h> 22397b6df1SKris Buschelman #endif 232907cef9SHong Zhang #endif 24397b6df1SKris Buschelman EXTERN_C_END 25397b6df1SKris Buschelman #define JOB_INIT -1 263d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 273d472b54SHong Zhang #define JOB_FACTNUMERIC 2 283d472b54SHong Zhang #define JOB_SOLVE 3 29397b6df1SKris Buschelman #define JOB_END -2 303d472b54SHong Zhang 312907cef9SHong Zhang /* calls to MUMPS */ 322907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 332907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 342907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 352907cef9SHong Zhang #else 362907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 372907cef9SHong Zhang #endif 382907cef9SHong Zhang #else 392907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 402907cef9SHong Zhang #define PetscMUMPS_c smumps_c 412907cef9SHong Zhang #else 422907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 432907cef9SHong Zhang #endif 442907cef9SHong Zhang #endif 452907cef9SHong Zhang 46940cd9d6SSatish Balay /* declare MumpsScalar */ 47940cd9d6SSatish Balay #if defined(PETSC_USE_COMPLEX) 48940cd9d6SSatish Balay #if defined(PETSC_USE_REAL_SINGLE) 49940cd9d6SSatish Balay #define MumpsScalar mumps_complex 50940cd9d6SSatish Balay #else 51940cd9d6SSatish Balay #define MumpsScalar mumps_double_complex 52940cd9d6SSatish Balay #endif 53940cd9d6SSatish Balay #else 54940cd9d6SSatish Balay #define MumpsScalar PetscScalar 55940cd9d6SSatish Balay #endif 563d472b54SHong Zhang 57397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 58397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 59397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 60397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 61a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 62397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 63adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 64397b6df1SKris Buschelman 65397b6df1SKris Buschelman typedef struct { 66397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 672907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 682907cef9SHong Zhang CMUMPS_STRUC_C id; 692907cef9SHong Zhang #else 70397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 712907cef9SHong Zhang #endif 722907cef9SHong Zhang #else 732907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 742907cef9SHong Zhang SMUMPS_STRUC_C id; 75397b6df1SKris Buschelman #else 76397b6df1SKris Buschelman DMUMPS_STRUC_C id; 77397b6df1SKris Buschelman #endif 782907cef9SHong Zhang #endif 792907cef9SHong Zhang 80397b6df1SKris Buschelman MatStructure matstruc; 81c1490034SHong Zhang PetscMPIInt myid,size; 82a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 83397b6df1SKris Buschelman PetscScalar *val; 84397b6df1SKris Buschelman MPI_Comm comm_mumps; 8564e6c443SBarry Smith PetscBool isAIJ,CleanUpMUMPS; 86a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 87801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 88801fbe65SHong Zhang Vec b_seq,x_seq; 89b34f08ffSHong Zhang PetscInt ninfo,*info; /* display INFO */ 90b5fa320bSStefano Zampini PetscBool schur_second_solve; 91b5fa320bSStefano Zampini PetscInt sizeredrhs; 92b5fa320bSStefano Zampini PetscInt *schur_pivots; 9359ac8732SStefano Zampini PetscInt schur_B_lwork; 94b5fa320bSStefano Zampini PetscScalar *schur_work; 9559ac8732SStefano Zampini PetscScalar *schur_sol; 9659ac8732SStefano Zampini PetscInt schur_sizesol; 9759ac8732SStefano Zampini PetscBool schur_restored; 9859ac8732SStefano Zampini PetscBool schur_factored; 9959ac8732SStefano Zampini PetscBool schur_inverted; 1002205254eSKarl Rupp 101bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 102bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 103f0c56d0fSKris Buschelman } Mat_MUMPS; 104f0c56d0fSKris Buschelman 10509573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 106b24902e0SBarry Smith 10759ac8732SStefano Zampini #undef __FUNCT__ 10859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsResetSchur_Private" 10959ac8732SStefano Zampini static PetscErrorCode MatMumpsResetSchur_Private(Mat_MUMPS* mumps) 110b5fa320bSStefano Zampini { 111b5fa320bSStefano Zampini PetscErrorCode ierr; 112b5fa320bSStefano Zampini 113b5fa320bSStefano Zampini PetscFunctionBegin; 11459ac8732SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 11559ac8732SStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 11659ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 11759ac8732SStefano Zampini ierr = PetscFree(mumps->schur_pivots);CHKERRQ(ierr); 11859ac8732SStefano Zampini ierr = PetscFree(mumps->schur_work);CHKERRQ(ierr); 11959ac8732SStefano Zampini if (!mumps->schur_restored) { 12059ac8732SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 12159ac8732SStefano Zampini } 12259ac8732SStefano Zampini mumps->id.size_schur = 0; 12359ac8732SStefano Zampini mumps->id.ICNTL(19) = 0; 12459ac8732SStefano Zampini PetscFunctionReturn(0); 12559ac8732SStefano Zampini } 12659ac8732SStefano Zampini 12759ac8732SStefano Zampini #undef __FUNCT__ 12859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsFactorSchur_Private" 12959ac8732SStefano Zampini static PetscErrorCode MatMumpsFactorSchur_Private(Mat_MUMPS* mumps) 13059ac8732SStefano Zampini { 13159ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 13259ac8732SStefano Zampini PetscErrorCode ierr; 13359ac8732SStefano Zampini 13459ac8732SStefano Zampini PetscFunctionBegin; 13559ac8732SStefano Zampini if (mumps->schur_factored) { 13659ac8732SStefano Zampini PetscFunctionReturn(0); 13759ac8732SStefano Zampini } 13859ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 13959ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 14059ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 14159ac8732SStefano Zampini if (!mumps->schur_pivots) { 14259ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 14359ac8732SStefano Zampini } 14459ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 14559ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&B_N,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&B_ierr)); 14659ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 14759ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRF Lapack routine %d",(int)B_ierr); 14859ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 14959ac8732SStefano Zampini char ord[2]; 15059ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 15159ac8732SStefano Zampini sprintf(ord,"L"); 15259ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 15359ac8732SStefano Zampini sprintf(ord,"U"); 15459ac8732SStefano Zampini } 15559ac8732SStefano Zampini if (mumps->id.sym == 2) { 15659ac8732SStefano Zampini if (!mumps->schur_pivots) { 15759ac8732SStefano Zampini PetscScalar lwork; 15859ac8732SStefano Zampini 15959ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 16059ac8732SStefano Zampini mumps->schur_B_lwork=-1; 16159ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 16359ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 16459ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYTRF Lapack routine %d",(int)B_ierr); 16559ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 16659ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 16759ac8732SStefano Zampini } 16859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 17059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRF Lapack routine %d",(int)B_ierr); 17259ac8732SStefano Zampini } else { 17359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 17459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,&B_ierr)); 17559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRF Lapack routine %d",(int)B_ierr); 17759ac8732SStefano Zampini } 17859ac8732SStefano Zampini } 17959ac8732SStefano Zampini mumps->schur_factored = PETSC_TRUE; 18059ac8732SStefano Zampini PetscFunctionReturn(0); 18159ac8732SStefano Zampini } 18259ac8732SStefano Zampini 18359ac8732SStefano Zampini #undef __FUNCT__ 18459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchur_Private" 18559ac8732SStefano Zampini static PetscErrorCode MatMumpsInvertSchur_Private(Mat_MUMPS* mumps) 18659ac8732SStefano Zampini { 18759ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 18859ac8732SStefano Zampini PetscErrorCode ierr; 18959ac8732SStefano Zampini 19059ac8732SStefano Zampini PetscFunctionBegin; 19159ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 19259ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 19359ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 19459ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 19559ac8732SStefano Zampini if (!mumps->schur_work) { 19659ac8732SStefano Zampini PetscScalar lwork; 19759ac8732SStefano Zampini 19859ac8732SStefano Zampini mumps->schur_B_lwork = -1; 19959ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 20159ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20259ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GETRI Lapack routine %d",(int)B_ierr); 20359ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 20459ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 20559ac8732SStefano Zampini } 20659ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20759ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 20859ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20959ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRI Lapack routine %d",(int)B_ierr); 21059ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 21159ac8732SStefano Zampini char ord[2]; 21259ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 21359ac8732SStefano Zampini sprintf(ord,"L"); 21459ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 21559ac8732SStefano Zampini sprintf(ord,"U"); 21659ac8732SStefano Zampini } 21759ac8732SStefano Zampini if (mumps->id.sym == 2) { 21859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&B_ierr)); 22059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRI Lapack routine %d",(int)B_ierr); 22259ac8732SStefano Zampini } else { 22359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,&B_ierr)); 22559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRI Lapack routine %d",(int)B_ierr); 22759ac8732SStefano Zampini } 22859ac8732SStefano Zampini } 22959ac8732SStefano Zampini mumps->schur_inverted = PETSC_TRUE; 23059ac8732SStefano Zampini PetscFunctionReturn(0); 23159ac8732SStefano Zampini } 23259ac8732SStefano Zampini 23359ac8732SStefano Zampini #undef __FUNCT__ 23459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchur_Private" 235e807eca7SStefano Zampini static PetscErrorCode MatMumpsSolveSchur_Private(Mat_MUMPS* mumps, PetscBool sol_in_redrhs) 23659ac8732SStefano Zampini { 23759ac8732SStefano Zampini PetscBLASInt B_N,B_Nrhs,B_ierr,B_slda,B_rlda; 23859ac8732SStefano Zampini PetscScalar one=1.,zero=0.; 23959ac8732SStefano Zampini PetscErrorCode ierr; 24059ac8732SStefano Zampini 24159ac8732SStefano Zampini PetscFunctionBegin; 24259ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 243b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 244b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 245b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.nrhs,&B_Nrhs);CHKERRQ(ierr); 246b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.lredrhs,&B_rlda);CHKERRQ(ierr); 24759ac8732SStefano Zampini if (mumps->schur_inverted) { 24859ac8732SStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 24959ac8732SStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 25059ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 25159ac8732SStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 25259ac8732SStefano Zampini mumps->schur_sizesol = sizesol; 253b5fa320bSStefano Zampini } 25459ac8732SStefano Zampini if (!mumps->sym) { 25559ac8732SStefano Zampini char type[2]; 256b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 25759ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25859ac8732SStefano Zampini sprintf(type,"N"); 259b5fa320bSStefano Zampini } else { 26059ac8732SStefano Zampini sprintf(type,"T"); 261b5fa320bSStefano Zampini } 26259ac8732SStefano Zampini } else { /* stored by columns */ 26359ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 26459ac8732SStefano Zampini sprintf(type,"T"); 26559ac8732SStefano Zampini } else { 26659ac8732SStefano Zampini sprintf(type,"N"); 26759ac8732SStefano Zampini } 26859ac8732SStefano Zampini } 26959ac8732SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_(type,"N",&B_N,&B_Nrhs,&B_N,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27059ac8732SStefano Zampini } else { 27159ac8732SStefano Zampini char ord[2]; 27259ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 27359ac8732SStefano Zampini sprintf(ord,"L"); 27459ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 27559ac8732SStefano Zampini sprintf(ord,"U"); 27659ac8732SStefano Zampini } 27759ac8732SStefano Zampini PetscStackCallBLAS("BLASsymm",BLASsymm_("L",ord,&B_N,&B_Nrhs,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27859ac8732SStefano Zampini } 279e807eca7SStefano Zampini if (sol_in_redrhs) { 28059ac8732SStefano Zampini ierr = PetscMemcpy(mumps->id.redrhs,mumps->schur_sol,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 281e807eca7SStefano Zampini } 282a12f35bfSStefano Zampini } else { /* Schur complement has not been inverted */ 283a12f35bfSStefano Zampini MumpsScalar *orhs=NULL; 284a12f35bfSStefano Zampini 285a12f35bfSStefano Zampini if (!sol_in_redrhs) { 286a12f35bfSStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 287a12f35bfSStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 288a12f35bfSStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 289a12f35bfSStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 290a12f35bfSStefano Zampini mumps->schur_sizesol = sizesol; 291a12f35bfSStefano Zampini } 292a12f35bfSStefano Zampini orhs = mumps->id.redrhs; 293a12f35bfSStefano Zampini ierr = PetscMemcpy(mumps->schur_sol,mumps->id.redrhs,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 294a12f35bfSStefano Zampini mumps->id.redrhs = (MumpsScalar*)mumps->schur_sol; 295a12f35bfSStefano Zampini } 29659ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 29759ac8732SStefano Zampini char type[2]; 29859ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 29959ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30059ac8732SStefano Zampini sprintf(type,"N"); 30159ac8732SStefano Zampini } else { 30259ac8732SStefano Zampini sprintf(type,"T"); 30359ac8732SStefano Zampini } 30459ac8732SStefano Zampini } else { /* stored by columns */ 30559ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30659ac8732SStefano Zampini sprintf(type,"T"); 30759ac8732SStefano Zampini } else { 30859ac8732SStefano Zampini sprintf(type,"N"); 30959ac8732SStefano Zampini } 31059ac8732SStefano Zampini } 31159ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 31259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_(type,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 313b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 314b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRS Lapack routine %d",(int)B_ierr); 315b5fa320bSStefano Zampini } else { /* either full or lower-triangular (not packed) */ 316b5fa320bSStefano Zampini char ord[2]; 317b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 318b5fa320bSStefano Zampini sprintf(ord,"L"); 319b5fa320bSStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 320b5fa320bSStefano Zampini sprintf(ord,"U"); 321b5fa320bSStefano Zampini } 322b5fa320bSStefano Zampini if (mumps->id.sym == 2) { 323b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 325b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 326b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRS Lapack routine %d",(int)B_ierr); 327b5fa320bSStefano Zampini } else { 328b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 330b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 331b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRS Lapack routine %d",(int)B_ierr); 332b5fa320bSStefano Zampini } 333b5fa320bSStefano Zampini } 334e807eca7SStefano Zampini if (!sol_in_redrhs) { 335a12f35bfSStefano Zampini mumps->id.redrhs = orhs; 336e807eca7SStefano Zampini } 33759ac8732SStefano Zampini } 338b5fa320bSStefano Zampini PetscFunctionReturn(0); 339b5fa320bSStefano Zampini } 340b5fa320bSStefano Zampini 34159ac8732SStefano Zampini #undef __FUNCT__ 34259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsHandleSchur_Private" 343b5fa320bSStefano Zampini static PetscErrorCode MatMumpsHandleSchur_Private(Mat_MUMPS* mumps) 344b5fa320bSStefano Zampini { 345b5fa320bSStefano Zampini PetscErrorCode ierr; 346b5fa320bSStefano Zampini 347b5fa320bSStefano Zampini PetscFunctionBegin; 348b5fa320bSStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing when Schur complement has not been computed */ 349b5fa320bSStefano Zampini PetscFunctionReturn(0); 350b5fa320bSStefano Zampini } 351b5fa320bSStefano Zampini if (!mumps->schur_second_solve) { /* prepare for the condensation step */ 352b5fa320bSStefano Zampini /* check if schur complement has been computed 353e807eca7SStefano Zampini We set by default ICNTL(26) == -1 when Schur indices have been provided by the user. 354b5fa320bSStefano Zampini According to MUMPS (5.0.0) manual, any value should be harmful during the factorization phase 355b5fa320bSStefano Zampini Unless the user provides a valid value for ICNTL(26), MatSolve and MatMatSolve routines solve the full system. 356b5fa320bSStefano Zampini This requires an extra call to PetscMUMPS_c and the computation of the factors for S, handled setting double_schur_solve to PETSC_TRUE */ 357b5fa320bSStefano Zampini if (mumps->id.ICNTL(26) < 0 || mumps->id.ICNTL(26) > 2) { 358b5fa320bSStefano Zampini PetscInt sizeredrhs = mumps->id.nrhs*mumps->id.size_schur; 359b5fa320bSStefano Zampini /* allocate MUMPS internal array to store reduced right-hand sides */ 360b5fa320bSStefano Zampini if (!mumps->id.redrhs || sizeredrhs > mumps->sizeredrhs) { 361b5fa320bSStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 362b5fa320bSStefano Zampini mumps->id.lredrhs = mumps->id.size_schur; 363b5fa320bSStefano Zampini ierr = PetscMalloc1(mumps->id.nrhs*mumps->id.lredrhs,&mumps->id.redrhs);CHKERRQ(ierr); 364b5fa320bSStefano Zampini mumps->sizeredrhs = mumps->id.nrhs*mumps->id.lredrhs; 365b5fa320bSStefano Zampini } 366b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_TRUE; 367b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 1; /* condensation phase */ 368b5fa320bSStefano Zampini } 369b5fa320bSStefano Zampini } else { /* prepare for the expansion step */ 370b5fa320bSStefano Zampini /* solve Schur complement (this should be done by the MUMPS user, so basically us) */ 371e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 372b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 2; /* expansion phase */ 373b5fa320bSStefano Zampini PetscMUMPS_c(&mumps->id); 374b5fa320bSStefano Zampini if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 375b5fa320bSStefano Zampini /* restore defaults */ 376b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 377b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 378b5fa320bSStefano Zampini } 379b5fa320bSStefano Zampini PetscFunctionReturn(0); 380b5fa320bSStefano Zampini } 381b5fa320bSStefano Zampini 382397b6df1SKris Buschelman /* 383d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], col[nz], val[nz] 384d341cd04SHong Zhang 385397b6df1SKris Buschelman input: 38667877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 387397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 388bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 389bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 390397b6df1SKris Buschelman output: 391397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 392397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 393eb9baa12SBarry Smith 394eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 395eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 396eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 397eb9baa12SBarry Smith 398397b6df1SKris Buschelman */ 39916ebf90aSShri Abhyankar 40016ebf90aSShri Abhyankar #undef __FUNCT__ 40116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 402bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 403b24902e0SBarry Smith { 404185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 40567877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 406dfbe8321SBarry Smith PetscErrorCode ierr; 407c1490034SHong Zhang PetscInt *row,*col; 40816ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 409397b6df1SKris Buschelman 410397b6df1SKris Buschelman PetscFunctionBegin; 41116ebf90aSShri Abhyankar *v=aa->a; 412bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4132205254eSKarl Rupp nz = aa->nz; 4142205254eSKarl Rupp ai = aa->i; 4152205254eSKarl Rupp aj = aa->j; 41616ebf90aSShri Abhyankar *nnz = nz; 417785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 418185f6596SHong Zhang col = row + nz; 419185f6596SHong Zhang 42016ebf90aSShri Abhyankar nz = 0; 42116ebf90aSShri Abhyankar for (i=0; i<M; i++) { 42216ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 42367877ebaSShri Abhyankar ajj = aj + ai[i]; 42467877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 42567877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 42616ebf90aSShri Abhyankar } 42716ebf90aSShri Abhyankar } 42816ebf90aSShri Abhyankar *r = row; *c = col; 42916ebf90aSShri Abhyankar } 43016ebf90aSShri Abhyankar PetscFunctionReturn(0); 43116ebf90aSShri Abhyankar } 432397b6df1SKris Buschelman 43316ebf90aSShri Abhyankar #undef __FUNCT__ 43467877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 435bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 43667877ebaSShri Abhyankar { 43767877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)A->data; 43833d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 43933d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 44067877ebaSShri Abhyankar PetscErrorCode ierr; 44167877ebaSShri Abhyankar PetscInt *row,*col; 44267877ebaSShri Abhyankar 44367877ebaSShri Abhyankar PetscFunctionBegin; 44433d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 44533d57670SJed Brown M = A->rmap->N/bs; 446cf3759fdSShri Abhyankar *v = aa->a; 447bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 448cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 44967877ebaSShri Abhyankar nz = bs2*aa->nz; 45067877ebaSShri Abhyankar *nnz = nz; 451785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 452185f6596SHong Zhang col = row + nz; 453185f6596SHong Zhang 45467877ebaSShri Abhyankar for (i=0; i<M; i++) { 45567877ebaSShri Abhyankar ajj = aj + ai[i]; 45667877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 45767877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 45867877ebaSShri Abhyankar for (j=0; j<bs; j++) { 45967877ebaSShri Abhyankar for (m=0; m<bs; m++) { 46067877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 461cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 46267877ebaSShri Abhyankar } 46367877ebaSShri Abhyankar } 46467877ebaSShri Abhyankar } 46567877ebaSShri Abhyankar } 466cf3759fdSShri Abhyankar *r = row; *c = col; 46767877ebaSShri Abhyankar } 46867877ebaSShri Abhyankar PetscFunctionReturn(0); 46967877ebaSShri Abhyankar } 47067877ebaSShri Abhyankar 47167877ebaSShri Abhyankar #undef __FUNCT__ 47216ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 473bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 47416ebf90aSShri Abhyankar { 47567877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 47667877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 47716ebf90aSShri Abhyankar PetscErrorCode ierr; 47816ebf90aSShri Abhyankar PetscInt *row,*col; 47916ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 48016ebf90aSShri Abhyankar 48116ebf90aSShri Abhyankar PetscFunctionBegin; 482882afa5aSHong Zhang *v = aa->a; 483bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4842205254eSKarl Rupp nz = aa->nz; 4852205254eSKarl Rupp ai = aa->i; 4862205254eSKarl Rupp aj = aa->j; 4872205254eSKarl Rupp *v = aa->a; 48816ebf90aSShri Abhyankar *nnz = nz; 489785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 490185f6596SHong Zhang col = row + nz; 491185f6596SHong Zhang 49216ebf90aSShri Abhyankar nz = 0; 49316ebf90aSShri Abhyankar for (i=0; i<M; i++) { 49416ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 49567877ebaSShri Abhyankar ajj = aj + ai[i]; 49667877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 49767877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 49816ebf90aSShri Abhyankar } 49916ebf90aSShri Abhyankar } 50016ebf90aSShri Abhyankar *r = row; *c = col; 50116ebf90aSShri Abhyankar } 50216ebf90aSShri Abhyankar PetscFunctionReturn(0); 50316ebf90aSShri Abhyankar } 50416ebf90aSShri Abhyankar 50516ebf90aSShri Abhyankar #undef __FUNCT__ 50616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 507bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 50816ebf90aSShri Abhyankar { 50967877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 51067877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 51167877ebaSShri Abhyankar const PetscScalar *av,*v1; 51216ebf90aSShri Abhyankar PetscScalar *val; 51316ebf90aSShri Abhyankar PetscErrorCode ierr; 51416ebf90aSShri Abhyankar PetscInt *row,*col; 515829b1710SHong Zhang Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 51616ebf90aSShri Abhyankar 51716ebf90aSShri Abhyankar PetscFunctionBegin; 51816ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 51916ebf90aSShri Abhyankar adiag=aa->diag; 520bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 521829b1710SHong Zhang /* count nz in the uppper triangular part of A */ 522829b1710SHong Zhang nz = 0; 523829b1710SHong Zhang for (i=0; i<M; i++) nz += ai[i+1] - adiag[i]; 52416ebf90aSShri Abhyankar *nnz = nz; 525829b1710SHong Zhang 526185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 527185f6596SHong Zhang col = row + nz; 528185f6596SHong Zhang val = (PetscScalar*)(col + nz); 529185f6596SHong Zhang 53016ebf90aSShri Abhyankar nz = 0; 53116ebf90aSShri Abhyankar for (i=0; i<M; i++) { 53216ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 53367877ebaSShri Abhyankar ajj = aj + adiag[i]; 534cf3759fdSShri Abhyankar v1 = av + adiag[i]; 53567877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 53667877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 53716ebf90aSShri Abhyankar } 53816ebf90aSShri Abhyankar } 53916ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 540397b6df1SKris Buschelman } else { 54116ebf90aSShri Abhyankar nz = 0; val = *v; 54216ebf90aSShri Abhyankar for (i=0; i <M; i++) { 54316ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 54467877ebaSShri Abhyankar ajj = aj + adiag[i]; 54567877ebaSShri Abhyankar v1 = av + adiag[i]; 54667877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 54767877ebaSShri Abhyankar val[nz++] = v1[j]; 54816ebf90aSShri Abhyankar } 54916ebf90aSShri Abhyankar } 55016ebf90aSShri Abhyankar } 55116ebf90aSShri Abhyankar PetscFunctionReturn(0); 55216ebf90aSShri Abhyankar } 55316ebf90aSShri Abhyankar 55416ebf90aSShri Abhyankar #undef __FUNCT__ 55516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 556bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 55716ebf90aSShri Abhyankar { 55816ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 55916ebf90aSShri Abhyankar PetscErrorCode ierr; 56016ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 56116ebf90aSShri Abhyankar PetscInt *row,*col; 56216ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 56316ebf90aSShri Abhyankar PetscScalar *val; 564397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 565397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 566397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 56716ebf90aSShri Abhyankar 56816ebf90aSShri Abhyankar PetscFunctionBegin; 569d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 570397b6df1SKris Buschelman av=aa->a; bv=bb->a; 571397b6df1SKris Buschelman 5722205254eSKarl Rupp garray = mat->garray; 5732205254eSKarl Rupp 574bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 57516ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 57616ebf90aSShri Abhyankar *nnz = nz; 577185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 578185f6596SHong Zhang col = row + nz; 579185f6596SHong Zhang val = (PetscScalar*)(col + nz); 580185f6596SHong Zhang 581397b6df1SKris Buschelman *r = row; *c = col; *v = val; 582397b6df1SKris Buschelman } else { 583397b6df1SKris Buschelman row = *r; col = *c; val = *v; 584397b6df1SKris Buschelman } 585397b6df1SKris Buschelman 586028e57e8SHong Zhang jj = 0; irow = rstart; 587397b6df1SKris Buschelman for (i=0; i<m; i++) { 588397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 589397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 590397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 591397b6df1SKris Buschelman bjj = bj + bi[i]; 59216ebf90aSShri Abhyankar v1 = av + ai[i]; 59316ebf90aSShri Abhyankar v2 = bv + bi[i]; 594397b6df1SKris Buschelman 595397b6df1SKris Buschelman /* A-part */ 596397b6df1SKris Buschelman for (j=0; j<countA; j++) { 597bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 598397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 599397b6df1SKris Buschelman } 60016ebf90aSShri Abhyankar val[jj++] = v1[j]; 601397b6df1SKris Buschelman } 60216ebf90aSShri Abhyankar 60316ebf90aSShri Abhyankar /* B-part */ 60416ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 605bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 606397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 607397b6df1SKris Buschelman } 60816ebf90aSShri Abhyankar val[jj++] = v2[j]; 60916ebf90aSShri Abhyankar } 61016ebf90aSShri Abhyankar irow++; 61116ebf90aSShri Abhyankar } 61216ebf90aSShri Abhyankar PetscFunctionReturn(0); 61316ebf90aSShri Abhyankar } 61416ebf90aSShri Abhyankar 61516ebf90aSShri Abhyankar #undef __FUNCT__ 61616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 617bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 61816ebf90aSShri Abhyankar { 61916ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 62016ebf90aSShri Abhyankar PetscErrorCode ierr; 62116ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 62216ebf90aSShri Abhyankar PetscInt *row,*col; 62316ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 62416ebf90aSShri Abhyankar PetscScalar *val; 62516ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 62616ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 62716ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 62816ebf90aSShri Abhyankar 62916ebf90aSShri Abhyankar PetscFunctionBegin; 63016ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 63116ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 63216ebf90aSShri Abhyankar 6332205254eSKarl Rupp garray = mat->garray; 6342205254eSKarl Rupp 635bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 63616ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 63716ebf90aSShri Abhyankar *nnz = nz; 638185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 639185f6596SHong Zhang col = row + nz; 640185f6596SHong Zhang val = (PetscScalar*)(col + nz); 641185f6596SHong Zhang 64216ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 64316ebf90aSShri Abhyankar } else { 64416ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 64516ebf90aSShri Abhyankar } 64616ebf90aSShri Abhyankar 64716ebf90aSShri Abhyankar jj = 0; irow = rstart; 64816ebf90aSShri Abhyankar for (i=0; i<m; i++) { 64916ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 65016ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 65116ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 65216ebf90aSShri Abhyankar bjj = bj + bi[i]; 65316ebf90aSShri Abhyankar v1 = av + ai[i]; 65416ebf90aSShri Abhyankar v2 = bv + bi[i]; 65516ebf90aSShri Abhyankar 65616ebf90aSShri Abhyankar /* A-part */ 65716ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 658bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 65916ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 66016ebf90aSShri Abhyankar } 66116ebf90aSShri Abhyankar val[jj++] = v1[j]; 66216ebf90aSShri Abhyankar } 66316ebf90aSShri Abhyankar 66416ebf90aSShri Abhyankar /* B-part */ 66516ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 666bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 66716ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 66816ebf90aSShri Abhyankar } 66916ebf90aSShri Abhyankar val[jj++] = v2[j]; 67016ebf90aSShri Abhyankar } 67116ebf90aSShri Abhyankar irow++; 67216ebf90aSShri Abhyankar } 67316ebf90aSShri Abhyankar PetscFunctionReturn(0); 67416ebf90aSShri Abhyankar } 67516ebf90aSShri Abhyankar 67616ebf90aSShri Abhyankar #undef __FUNCT__ 67767877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij" 678bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 67967877ebaSShri Abhyankar { 68067877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 68167877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 68267877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 68367877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 684d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 68533d57670SJed Brown const PetscInt bs2=mat->bs2; 68667877ebaSShri Abhyankar PetscErrorCode ierr; 68733d57670SJed Brown PetscInt bs,nz,i,j,k,n,jj,irow,countA,countB,idx; 68867877ebaSShri Abhyankar PetscInt *row,*col; 68967877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 69067877ebaSShri Abhyankar PetscScalar *val; 69167877ebaSShri Abhyankar 69267877ebaSShri Abhyankar PetscFunctionBegin; 69333d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 694bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 69567877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 69667877ebaSShri Abhyankar *nnz = nz; 697185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 698185f6596SHong Zhang col = row + nz; 699185f6596SHong Zhang val = (PetscScalar*)(col + nz); 700185f6596SHong Zhang 70167877ebaSShri Abhyankar *r = row; *c = col; *v = val; 70267877ebaSShri Abhyankar } else { 70367877ebaSShri Abhyankar row = *r; col = *c; val = *v; 70467877ebaSShri Abhyankar } 70567877ebaSShri Abhyankar 706d985c460SShri Abhyankar jj = 0; irow = rstart; 70767877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 70867877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 70967877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 71067877ebaSShri Abhyankar ajj = aj + ai[i]; 71167877ebaSShri Abhyankar bjj = bj + bi[i]; 71267877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 71367877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 71467877ebaSShri Abhyankar 71567877ebaSShri Abhyankar idx = 0; 71667877ebaSShri Abhyankar /* A-part */ 71767877ebaSShri Abhyankar for (k=0; k<countA; k++) { 71867877ebaSShri Abhyankar for (j=0; j<bs; j++) { 71967877ebaSShri Abhyankar for (n=0; n<bs; n++) { 720bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 721d985c460SShri Abhyankar row[jj] = irow + n + shift; 722d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 72367877ebaSShri Abhyankar } 72467877ebaSShri Abhyankar val[jj++] = v1[idx++]; 72567877ebaSShri Abhyankar } 72667877ebaSShri Abhyankar } 72767877ebaSShri Abhyankar } 72867877ebaSShri Abhyankar 72967877ebaSShri Abhyankar idx = 0; 73067877ebaSShri Abhyankar /* B-part */ 73167877ebaSShri Abhyankar for (k=0; k<countB; k++) { 73267877ebaSShri Abhyankar for (j=0; j<bs; j++) { 73367877ebaSShri Abhyankar for (n=0; n<bs; n++) { 734bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 735d985c460SShri Abhyankar row[jj] = irow + n + shift; 736d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 73767877ebaSShri Abhyankar } 738d985c460SShri Abhyankar val[jj++] = v2[idx++]; 73967877ebaSShri Abhyankar } 74067877ebaSShri Abhyankar } 74167877ebaSShri Abhyankar } 742d985c460SShri Abhyankar irow += bs; 74367877ebaSShri Abhyankar } 74467877ebaSShri Abhyankar PetscFunctionReturn(0); 74567877ebaSShri Abhyankar } 74667877ebaSShri Abhyankar 74767877ebaSShri Abhyankar #undef __FUNCT__ 74816ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 749bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 75016ebf90aSShri Abhyankar { 75116ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 75216ebf90aSShri Abhyankar PetscErrorCode ierr; 753e0bace9bSHong Zhang PetscInt rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 75416ebf90aSShri Abhyankar PetscInt *row,*col; 75516ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 75616ebf90aSShri Abhyankar PetscScalar *val; 75716ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 75816ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 75916ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 76016ebf90aSShri Abhyankar 76116ebf90aSShri Abhyankar PetscFunctionBegin; 76216ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 76316ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 76416ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 7652205254eSKarl Rupp 76616ebf90aSShri Abhyankar rstart = A->rmap->rstart; 76716ebf90aSShri Abhyankar 768bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 769e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 770e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 77116ebf90aSShri Abhyankar for (i=0; i<m; i++) { 772e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 77316ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 77416ebf90aSShri Abhyankar bjj = bj + bi[i]; 775e0bace9bSHong Zhang for (j=0; j<countB; j++) { 776e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 777e0bace9bSHong Zhang } 778e0bace9bSHong Zhang } 77916ebf90aSShri Abhyankar 780e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 78116ebf90aSShri Abhyankar *nnz = nz; 782185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 783185f6596SHong Zhang col = row + nz; 784185f6596SHong Zhang val = (PetscScalar*)(col + nz); 785185f6596SHong Zhang 78616ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 78716ebf90aSShri Abhyankar } else { 78816ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 78916ebf90aSShri Abhyankar } 79016ebf90aSShri Abhyankar 79116ebf90aSShri Abhyankar jj = 0; irow = rstart; 79216ebf90aSShri Abhyankar for (i=0; i<m; i++) { 79316ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 79416ebf90aSShri Abhyankar v1 = av + adiag[i]; 79516ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 79616ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 79716ebf90aSShri Abhyankar bjj = bj + bi[i]; 79816ebf90aSShri Abhyankar v2 = bv + bi[i]; 79916ebf90aSShri Abhyankar 80016ebf90aSShri Abhyankar /* A-part */ 80116ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 802bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 80316ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 80416ebf90aSShri Abhyankar } 80516ebf90aSShri Abhyankar val[jj++] = v1[j]; 80616ebf90aSShri Abhyankar } 80716ebf90aSShri Abhyankar 80816ebf90aSShri Abhyankar /* B-part */ 80916ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 81016ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 811bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 81216ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 81316ebf90aSShri Abhyankar } 81416ebf90aSShri Abhyankar val[jj++] = v2[j]; 81516ebf90aSShri Abhyankar } 816397b6df1SKris Buschelman } 817397b6df1SKris Buschelman irow++; 818397b6df1SKris Buschelman } 819397b6df1SKris Buschelman PetscFunctionReturn(0); 820397b6df1SKris Buschelman } 821397b6df1SKris Buschelman 822397b6df1SKris Buschelman #undef __FUNCT__ 82320be8e61SHong Zhang #define __FUNCT__ "MatGetDiagonal_MUMPS" 82420be8e61SHong Zhang PetscErrorCode MatGetDiagonal_MUMPS(Mat A,Vec v) 82520be8e61SHong Zhang { 82620be8e61SHong Zhang PetscFunctionBegin; 82720be8e61SHong Zhang SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Mat type: MUMPS factor"); 82820be8e61SHong Zhang PetscFunctionReturn(0); 82920be8e61SHong Zhang } 83020be8e61SHong Zhang 83120be8e61SHong Zhang #undef __FUNCT__ 8323924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 833dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A) 834dfbe8321SBarry Smith { 835a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 836dfbe8321SBarry Smith PetscErrorCode ierr; 837b24902e0SBarry Smith 838397b6df1SKris Buschelman PetscFunctionBegin; 839a5e57a09SHong Zhang if (mumps->CleanUpMUMPS) { 840397b6df1SKris Buschelman /* Terminate instance, deallocate memories */ 841a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 842a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 843a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 844801fbe65SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 845a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 846a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 847a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 848b34f08ffSHong Zhang ierr = PetscFree(mumps->info);CHKERRQ(ierr); 84959ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 850a5e57a09SHong Zhang mumps->id.job = JOB_END; 851a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 852a5e57a09SHong Zhang ierr = MPI_Comm_free(&(mumps->comm_mumps));CHKERRQ(ierr); 853397b6df1SKris Buschelman } 854a5e57a09SHong Zhang if (mumps->Destroy) { 855a5e57a09SHong Zhang ierr = (mumps->Destroy)(A);CHKERRQ(ierr); 856bf0cc555SLisandro Dalcin } 857bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 858bf0cc555SLisandro Dalcin 85997969023SHong Zhang /* clear composed functions */ 860bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 861bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 862bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetIcntl_C",NULL);CHKERRQ(ierr); 863bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 864bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetCntl_C",NULL);CHKERRQ(ierr); 865bc6112feSHong Zhang 866ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfo_C",NULL);CHKERRQ(ierr); 867ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfog_C",NULL);CHKERRQ(ierr); 868ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfo_C",NULL);CHKERRQ(ierr); 869ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfog_C",NULL);CHKERRQ(ierr); 8706444a565SStefano Zampini 8716444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetSchurIndices_C",NULL);CHKERRQ(ierr); 87259ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsInvertSchurComplement_C",NULL);CHKERRQ(ierr); 87359ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsCreateSchurComplement_C",NULL);CHKERRQ(ierr); 8746444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetSchurComplement_C",NULL);CHKERRQ(ierr); 87559ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsRestoreSchurComplement_C",NULL);CHKERRQ(ierr); 876e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSolveSchurComplement_C",NULL);CHKERRQ(ierr); 8777404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSolveSchurComplementTranspose_C",NULL);CHKERRQ(ierr); 878397b6df1SKris Buschelman PetscFunctionReturn(0); 879397b6df1SKris Buschelman } 880397b6df1SKris Buschelman 881397b6df1SKris Buschelman #undef __FUNCT__ 882f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 883b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 884b24902e0SBarry Smith { 885a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 886d54de34fSKris Buschelman PetscScalar *array; 88767877ebaSShri Abhyankar Vec b_seq; 888329ec9b3SHong Zhang IS is_iden,is_petsc; 889dfbe8321SBarry Smith PetscErrorCode ierr; 890329ec9b3SHong Zhang PetscInt i; 891883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 892397b6df1SKris Buschelman 893397b6df1SKris Buschelman PetscFunctionBegin; 894883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 895883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 896a5e57a09SHong Zhang mumps->id.nrhs = 1; 897a5e57a09SHong Zhang b_seq = mumps->b_seq; 898a5e57a09SHong Zhang if (mumps->size > 1) { 899329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */ 900a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 901a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 902a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 903397b6df1SKris Buschelman } else { /* size == 1 */ 904397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 905397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 906397b6df1SKris Buschelman } 907a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 908a5e57a09SHong Zhang mumps->id.nrhs = 1; 909940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 910397b6df1SKris Buschelman } 911397b6df1SKris Buschelman 912b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 913b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 914b5fa320bSStefano Zampini 915397b6df1SKris Buschelman /* solve phase */ 916329ec9b3SHong Zhang /*-------------*/ 917a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 918a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 919a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 920397b6df1SKris Buschelman 921b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 922b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 923b5fa320bSStefano Zampini 924a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 925a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 926a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 927a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 928397b6df1SKris Buschelman } 929a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 930a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 931a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 932a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 933a5e57a09SHong Zhang } 934a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 935a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 9366bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9376bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 9382205254eSKarl Rupp 939a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 940397b6df1SKris Buschelman } 941a5e57a09SHong Zhang 942a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 943a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 944329ec9b3SHong Zhang } 945397b6df1SKris Buschelman PetscFunctionReturn(0); 946397b6df1SKris Buschelman } 947397b6df1SKris Buschelman 94851d5961aSHong Zhang #undef __FUNCT__ 94951d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 95051d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 95151d5961aSHong Zhang { 952a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 95351d5961aSHong Zhang PetscErrorCode ierr; 95451d5961aSHong Zhang 95551d5961aSHong Zhang PetscFunctionBegin; 956a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 9570ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 958a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 95951d5961aSHong Zhang PetscFunctionReturn(0); 96051d5961aSHong Zhang } 96151d5961aSHong Zhang 962e0b74bf9SHong Zhang #undef __FUNCT__ 963e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 964e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 965e0b74bf9SHong Zhang { 966bda8bf91SBarry Smith PetscErrorCode ierr; 967bda8bf91SBarry Smith PetscBool flg; 9684e34a73bSHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 969334c5f61SHong Zhang PetscInt i,nrhs,M; 9702cd7d884SHong Zhang PetscScalar *array,*bray; 971bda8bf91SBarry Smith 972e0b74bf9SHong Zhang PetscFunctionBegin; 9730298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 974801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 9750298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 976801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 977801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 9784e34a73bSHong Zhang 9792cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 980334c5f61SHong Zhang mumps->id.nrhs = nrhs; 981334c5f61SHong Zhang mumps->id.lrhs = M; 9824e34a73bSHong Zhang 9832cd7d884SHong Zhang if (mumps->size == 1) { 9842cd7d884SHong Zhang /* copy B to X */ 9852cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 9862cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 9876444a565SStefano Zampini ierr = PetscMemcpy(array,bray,M*nrhs*sizeof(PetscScalar));CHKERRQ(ierr); 9882cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 989940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 990b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 991b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 992801fbe65SHong Zhang 9932cd7d884SHong Zhang /* solve phase */ 9942cd7d884SHong Zhang /*-------------*/ 9952cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 9962cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 9972cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 998b5fa320bSStefano Zampini 999b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 1000b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 10012cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 1002334c5f61SHong Zhang } else { /*--------- parallel case --------*/ 100371aed81dSHong Zhang PetscInt lsol_loc,nlsol_loc,*isol_loc,*idx,*iidx,*idxx,*isol_loc_save; 10041070efccSSatish Balay MumpsScalar *sol_loc,*sol_loc_save; 1005801fbe65SHong Zhang IS is_to,is_from; 1006334c5f61SHong Zhang PetscInt k,proc,j,m; 1007801fbe65SHong Zhang const PetscInt *rstart; 1008334c5f61SHong Zhang Vec v_mpi,b_seq,x_seq; 1009334c5f61SHong Zhang VecScatter scat_rhs,scat_sol; 1010801fbe65SHong Zhang 1011801fbe65SHong Zhang /* create x_seq to hold local solution */ 101271aed81dSHong Zhang isol_loc_save = mumps->id.isol_loc; /* save it for MatSovle() */ 101371aed81dSHong Zhang sol_loc_save = mumps->id.sol_loc; 1014801fbe65SHong Zhang 101571aed81dSHong Zhang lsol_loc = mumps->id.INFO(23); 101671aed81dSHong Zhang nlsol_loc = nrhs*lsol_loc; /* length of sol_loc */ 101771aed81dSHong Zhang ierr = PetscMalloc2(nlsol_loc,&sol_loc,nlsol_loc,&isol_loc);CHKERRQ(ierr); 1018940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1019801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 1020801fbe65SHong Zhang 10211070efccSSatish Balay ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,nlsol_loc,(PetscScalar*)sol_loc,&x_seq);CHKERRQ(ierr); 10222cd7d884SHong Zhang 102374f0fcc7SHong Zhang /* copy rhs matrix B into vector v_mpi */ 1024334c5f61SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 1025801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 102674f0fcc7SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&v_mpi);CHKERRQ(ierr); 1027801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 1028801fbe65SHong Zhang 1029334c5f61SHong Zhang /* scatter v_mpi to b_seq because MUMPS only supports centralized rhs */ 103074f0fcc7SHong Zhang /* idx: maps from k-th index of v_mpi to (i,j)-th global entry of B; 1031801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 1032801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 1033801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 1034801fbe65SHong Zhang k = 0; 1035801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 1036801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 1037801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 1038801fbe65SHong Zhang iidx[j*M + i] = k; 1039801fbe65SHong Zhang idx[k++] = j*M + i; 1040801fbe65SHong Zhang } 1041801fbe65SHong Zhang } 10422cd7d884SHong Zhang } 10432cd7d884SHong Zhang 1044801fbe65SHong Zhang if (!mumps->myid) { 1045334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&b_seq);CHKERRQ(ierr); 1046801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1047801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 1048801fbe65SHong Zhang } else { 1049334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&b_seq);CHKERRQ(ierr); 1050801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 1051801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 1052801fbe65SHong Zhang } 1053334c5f61SHong Zhang ierr = VecScatterCreate(v_mpi,is_from,b_seq,is_to,&scat_rhs);CHKERRQ(ierr); 1054334c5f61SHong Zhang ierr = VecScatterBegin(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1055801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1056801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1057334c5f61SHong Zhang ierr = VecScatterEnd(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1058801fbe65SHong Zhang 1059801fbe65SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 1060334c5f61SHong Zhang ierr = VecGetArray(b_seq,&bray);CHKERRQ(ierr); 1061940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)bray; 1062334c5f61SHong Zhang ierr = VecRestoreArray(b_seq,&bray);CHKERRQ(ierr); 1063801fbe65SHong Zhang } 1064801fbe65SHong Zhang 1065801fbe65SHong Zhang /* solve phase */ 1066801fbe65SHong Zhang /*-------------*/ 1067801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 1068801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 1069801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 1070801fbe65SHong Zhang 1071334c5f61SHong Zhang /* scatter mumps distributed solution to petsc vector v_mpi, which shares local arrays with solution matrix X */ 107274f0fcc7SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 107374f0fcc7SHong Zhang ierr = VecPlaceArray(v_mpi,array);CHKERRQ(ierr); 1074801fbe65SHong Zhang 1075334c5f61SHong Zhang /* create scatter scat_sol */ 107671aed81dSHong Zhang ierr = PetscMalloc1(nlsol_loc,&idxx);CHKERRQ(ierr); 107771aed81dSHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nlsol_loc,0,1,&is_from);CHKERRQ(ierr); 107871aed81dSHong Zhang for (i=0; i<lsol_loc; i++) { 1079334c5f61SHong Zhang isol_loc[i] -= 1; /* change Fortran style to C style */ 1080334c5f61SHong Zhang idxx[i] = iidx[isol_loc[i]]; 1081801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 1082334c5f61SHong Zhang idxx[j*lsol_loc+i] = iidx[isol_loc[i]+j*M]; 1083801fbe65SHong Zhang } 1084801fbe65SHong Zhang } 108571aed81dSHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nlsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1086334c5f61SHong Zhang ierr = VecScatterCreate(x_seq,is_from,v_mpi,is_to,&scat_sol);CHKERRQ(ierr); 1087334c5f61SHong Zhang ierr = VecScatterBegin(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1088801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1089801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1090334c5f61SHong Zhang ierr = VecScatterEnd(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1091801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 109271aed81dSHong Zhang 109371aed81dSHong Zhang /* free spaces */ 109471aed81dSHong Zhang mumps->id.sol_loc = sol_loc_save; 109571aed81dSHong Zhang mumps->id.isol_loc = isol_loc_save; 109671aed81dSHong Zhang 109771aed81dSHong Zhang ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 1098801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 1099801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 110071aed81dSHong Zhang ierr = VecDestroy(&x_seq);CHKERRQ(ierr); 110174f0fcc7SHong Zhang ierr = VecDestroy(&v_mpi);CHKERRQ(ierr); 1102334c5f61SHong Zhang ierr = VecDestroy(&b_seq);CHKERRQ(ierr); 1103334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_rhs);CHKERRQ(ierr); 1104334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_sol);CHKERRQ(ierr); 1105801fbe65SHong Zhang } 1106e0b74bf9SHong Zhang PetscFunctionReturn(0); 1107e0b74bf9SHong Zhang } 1108e0b74bf9SHong Zhang 1109ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 1110a58c3f20SHong Zhang /* 1111a58c3f20SHong Zhang input: 1112a58c3f20SHong Zhang F: numeric factor 1113a58c3f20SHong Zhang output: 1114a58c3f20SHong Zhang nneg: total number of negative pivots 1115a58c3f20SHong Zhang nzero: 0 1116a58c3f20SHong Zhang npos: (global dimension of F) - nneg 1117a58c3f20SHong Zhang */ 1118a58c3f20SHong Zhang 1119a58c3f20SHong Zhang #undef __FUNCT__ 1120a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 1121dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 1122a58c3f20SHong Zhang { 1123a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1124dfbe8321SBarry Smith PetscErrorCode ierr; 1125c1490034SHong Zhang PetscMPIInt size; 1126a58c3f20SHong Zhang 1127a58c3f20SHong Zhang PetscFunctionBegin; 1128ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 1129bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 1130a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 1131ed85ac9fSHong Zhang 1132710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 1133ed85ac9fSHong Zhang if (nzero || npos) { 1134ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 1135710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 1136710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 1137a58c3f20SHong Zhang } 1138a58c3f20SHong Zhang PetscFunctionReturn(0); 1139a58c3f20SHong Zhang } 1140ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 1141a58c3f20SHong Zhang 1142397b6df1SKris Buschelman #undef __FUNCT__ 1143f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 11440481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 1145af281ebdSHong Zhang { 1146a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 11476849ba73SBarry Smith PetscErrorCode ierr; 1148e09efc27SHong Zhang Mat F_diag; 1149ace3abfcSBarry Smith PetscBool isMPIAIJ; 1150397b6df1SKris Buschelman 1151397b6df1SKris Buschelman PetscFunctionBegin; 1152a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1153397b6df1SKris Buschelman 1154397b6df1SKris Buschelman /* numerical factorization phase */ 1155329ec9b3SHong Zhang /*-------------------------------*/ 1156a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 11574e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 1158a5e57a09SHong Zhang if (!mumps->myid) { 1159940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 1160397b6df1SKris Buschelman } 1161397b6df1SKris Buschelman } else { 1162940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 1163397b6df1SKris Buschelman } 1164a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1165a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 1166151787a6SHong Zhang if (mumps->id.INFO(1) == -13) { 1167151787a6SHong Zhang if (mumps->id.INFO(2) < 0) { 1168151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",-mumps->id.INFO(2)); 1169151787a6SHong Zhang } else { 1170151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d bytes\n",mumps->id.INFO(2)); 1171151787a6SHong Zhang } 1172151787a6SHong Zhang } else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 1173397b6df1SKris Buschelman } 1174a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 1175397b6df1SKris Buschelman 1176dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 1177a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 1178a5e57a09SHong Zhang mumps->CleanUpMUMPS = PETSC_TRUE; 1179b5fa320bSStefano Zampini mumps->schur_factored = PETSC_FALSE; 118059ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 118167877ebaSShri Abhyankar 1182066565c5SStefano Zampini /* just to be sure that ICNTL(19) value returned by a call from MatMumpsGetIcntl is always consistent */ 1183066565c5SStefano Zampini if (!mumps->sym && mumps->id.ICNTL(19) && mumps->id.ICNTL(19) != 1) mumps->id.ICNTL(19) = 3; 1184066565c5SStefano Zampini 1185a5e57a09SHong Zhang if (mumps->size > 1) { 118667877ebaSShri Abhyankar PetscInt lsol_loc; 118767877ebaSShri Abhyankar PetscScalar *sol_loc; 11882205254eSKarl Rupp 1189c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 1190c2093ab7SHong Zhang if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 1191c2093ab7SHong Zhang else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 1192c2093ab7SHong Zhang F_diag->assembled = PETSC_TRUE; 1193c2093ab7SHong Zhang 1194c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 1195c2093ab7SHong Zhang if (mumps->x_seq) { 1196c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 1197c2093ab7SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 1198c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 1199c2093ab7SHong Zhang } 1200a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 1201dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 1202a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 1203940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1204a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 120567877ebaSShri Abhyankar } 1206397b6df1SKris Buschelman PetscFunctionReturn(0); 1207397b6df1SKris Buschelman } 1208397b6df1SKris Buschelman 12099a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 1210dcd589f8SShri Abhyankar #undef __FUNCT__ 12119a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 12129a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 1213dcd589f8SShri Abhyankar { 12149a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1215dcd589f8SShri Abhyankar PetscErrorCode ierr; 1216b34f08ffSHong Zhang PetscInt icntl,info[40],i,ninfo=40; 1217ace3abfcSBarry Smith PetscBool flg; 1218dcd589f8SShri Abhyankar 1219dcd589f8SShri Abhyankar PetscFunctionBegin; 1220ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 12219a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 12229a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 12239a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 12249a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 12259a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 12269a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 1227dcd589f8SShri Abhyankar 12289a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 12299a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 12309a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 12319a2535b5SHong Zhang 1232d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 12339a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 12349a2535b5SHong Zhang 1235d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 1236dcd589f8SShri Abhyankar if (flg) { 12372205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 12382205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 1239dcd589f8SShri Abhyankar } 1240e0b74bf9SHong Zhang 12410298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 1242d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 12430298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 1244d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 1245d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 1246d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 1247d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 1248d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 124959ac8732SStefano Zampini if (mumps->id.ICNTL(19) <= 0 || mumps->id.ICNTL(19) > 3) { /* reset any schur data (if any) */ 125059ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 125159ac8732SStefano Zampini } 12524e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 1253d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 12549a2535b5SHong Zhang 1255d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 12560298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 12570298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 12589a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 12599a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 1260d7ebd59bSHong Zhang } 1261d7ebd59bSHong Zhang 1262d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 1263d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 12642cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 12650298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 1266d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 12670298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 1268d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 12694e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 12700298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1271dcd589f8SShri Abhyankar 12720298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 12730298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 12740298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 12750298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 12760298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1277e5bb22a1SHong Zhang 12780298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1279b34f08ffSHong Zhang 128016d797efSHong Zhang ierr = PetscOptionsIntArray("-mat_mumps_view_info","request INFO local to each processor","",info,&ninfo,NULL);CHKERRQ(ierr); 1281b34f08ffSHong Zhang if (ninfo) { 1282b34f08ffSHong Zhang if (ninfo > 40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"number of INFO %d must <= 40\n",ninfo); 1283b34f08ffSHong Zhang ierr = PetscMalloc1(ninfo,&mumps->info);CHKERRQ(ierr); 1284b34f08ffSHong Zhang mumps->ninfo = ninfo; 1285b34f08ffSHong Zhang for (i=0; i<ninfo; i++) { 1286b34f08ffSHong Zhang if (info[i] < 0 || info[i]>40) { 1287b34f08ffSHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"index of INFO %d must between 1 and 40\n",ninfo); 1288b34f08ffSHong Zhang } else { 1289b34f08ffSHong Zhang mumps->info[i] = info[i]; 1290b34f08ffSHong Zhang } 1291b34f08ffSHong Zhang } 1292b34f08ffSHong Zhang } 1293b34f08ffSHong Zhang 1294dcd589f8SShri Abhyankar PetscOptionsEnd(); 1295dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1296dcd589f8SShri Abhyankar } 1297dcd589f8SShri Abhyankar 1298dcd589f8SShri Abhyankar #undef __FUNCT__ 1299dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1300f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1301dcd589f8SShri Abhyankar { 1302dcd589f8SShri Abhyankar PetscErrorCode ierr; 1303dcd589f8SShri Abhyankar 1304dcd589f8SShri Abhyankar PetscFunctionBegin; 1305ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1306ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1307ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 13082205254eSKarl Rupp 1309f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1310f697e70eSHong Zhang 1311f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1312f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1313f697e70eSHong Zhang mumps->id.sym = mumps->sym; 13142907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1315f697e70eSHong Zhang 1316f697e70eSHong Zhang mumps->CleanUpMUMPS = PETSC_FALSE; 13170298fd71SBarry Smith mumps->scat_rhs = NULL; 13180298fd71SBarry Smith mumps->scat_sol = NULL; 13199a2535b5SHong Zhang 132070544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 13219a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 13229a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 13239a2535b5SHong Zhang if (mumps->size == 1) { 13249a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 13259a2535b5SHong Zhang } else { 13269a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 13274e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 132870544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 13299a2535b5SHong Zhang } 13306444a565SStefano Zampini 13316444a565SStefano Zampini /* schur */ 13326444a565SStefano Zampini mumps->id.size_schur = 0; 13336444a565SStefano Zampini mumps->id.listvar_schur = NULL; 13346444a565SStefano Zampini mumps->id.schur = NULL; 1335b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 1336b5fa320bSStefano Zampini mumps->sizeredrhs = 0; 1337b5fa320bSStefano Zampini mumps->schur_pivots = NULL; 1338b5fa320bSStefano Zampini mumps->schur_work = NULL; 133959ac8732SStefano Zampini mumps->schur_sol = NULL; 134059ac8732SStefano Zampini mumps->schur_sizesol = 0; 134159ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 134259ac8732SStefano Zampini mumps->schur_factored = PETSC_FALSE; 134359ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 1344dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1345dcd589f8SShri Abhyankar } 1346dcd589f8SShri Abhyankar 1347a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1348397b6df1SKris Buschelman #undef __FUNCT__ 1349f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 13500481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1351b24902e0SBarry Smith { 1352a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1353dcd589f8SShri Abhyankar PetscErrorCode ierr; 135467877ebaSShri Abhyankar Vec b; 135567877ebaSShri Abhyankar IS is_iden; 135667877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1357397b6df1SKris Buschelman 1358397b6df1SKris Buschelman PetscFunctionBegin; 1359a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1360dcd589f8SShri Abhyankar 13619a2535b5SHong Zhang /* Set MUMPS options from the options database */ 13629a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1363dcd589f8SShri Abhyankar 1364a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1365dcd589f8SShri Abhyankar 136667877ebaSShri Abhyankar /* analysis phase */ 136767877ebaSShri Abhyankar /*----------------*/ 1368a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1369a5e57a09SHong Zhang mumps->id.n = M; 1370a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 137167877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1372a5e57a09SHong Zhang if (!mumps->myid) { 1373a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1374a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1375940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 137667877ebaSShri Abhyankar } 1377a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 13785248a706SHong Zhang /* 13795248a706SHong Zhang PetscBool flag; 13805248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 13815248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 13825248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 13835248a706SHong Zhang */ 1384a5e57a09SHong Zhang if (!mumps->myid) { 1385e0b74bf9SHong Zhang const PetscInt *idx; 1386e0b74bf9SHong Zhang PetscInt i,*perm_in; 13872205254eSKarl Rupp 1388785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1389e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 13902205254eSKarl Rupp 1391a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1392e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */ 1393e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1394e0b74bf9SHong Zhang } 1395e0b74bf9SHong Zhang } 139667877ebaSShri Abhyankar } 139767877ebaSShri Abhyankar break; 139867877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1399a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1400a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1401a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1402940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 140367877ebaSShri Abhyankar } 140467877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1405a5e57a09SHong Zhang if (!mumps->myid) { 14062cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 14072cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 140867877ebaSShri Abhyankar } else { 1409a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 141067877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 141167877ebaSShri Abhyankar } 14122a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1413a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14146bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14156bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 141667877ebaSShri Abhyankar break; 141767877ebaSShri Abhyankar } 1418a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1419a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 142067877ebaSShri Abhyankar 1421719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1422dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 142351d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 14244e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1425b24902e0SBarry Smith PetscFunctionReturn(0); 1426b24902e0SBarry Smith } 1427b24902e0SBarry Smith 1428450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1429450b117fSShri Abhyankar #undef __FUNCT__ 1430450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 1431450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1432450b117fSShri Abhyankar { 1433a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1434dcd589f8SShri Abhyankar PetscErrorCode ierr; 143567877ebaSShri Abhyankar Vec b; 143667877ebaSShri Abhyankar IS is_iden; 143767877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1438450b117fSShri Abhyankar 1439450b117fSShri Abhyankar PetscFunctionBegin; 1440a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1441dcd589f8SShri Abhyankar 14429a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14439a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1444dcd589f8SShri Abhyankar 1445a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 144667877ebaSShri Abhyankar 144767877ebaSShri Abhyankar /* analysis phase */ 144867877ebaSShri Abhyankar /*----------------*/ 1449a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1450a5e57a09SHong Zhang mumps->id.n = M; 1451a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 145267877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1453a5e57a09SHong Zhang if (!mumps->myid) { 1454a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1455a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1456940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 145767877ebaSShri Abhyankar } 145867877ebaSShri Abhyankar } 145967877ebaSShri Abhyankar break; 146067877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1461a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1462a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1463a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1464940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 146567877ebaSShri Abhyankar } 146667877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1467a5e57a09SHong Zhang if (!mumps->myid) { 1468a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 146967877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 147067877ebaSShri Abhyankar } else { 1471a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 147267877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 147367877ebaSShri Abhyankar } 14742a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1475a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14766bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14776bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 147867877ebaSShri Abhyankar break; 147967877ebaSShri Abhyankar } 1480a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1481a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 148267877ebaSShri Abhyankar 1483450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1484dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 148551d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1486450b117fSShri Abhyankar PetscFunctionReturn(0); 1487450b117fSShri Abhyankar } 1488b24902e0SBarry Smith 1489141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1490397b6df1SKris Buschelman #undef __FUNCT__ 149167877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 149267877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1493b24902e0SBarry Smith { 1494a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1495dcd589f8SShri Abhyankar PetscErrorCode ierr; 149667877ebaSShri Abhyankar Vec b; 149767877ebaSShri Abhyankar IS is_iden; 149867877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1499397b6df1SKris Buschelman 1500397b6df1SKris Buschelman PetscFunctionBegin; 1501a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1502dcd589f8SShri Abhyankar 15039a2535b5SHong Zhang /* Set MUMPS options from the options database */ 15049a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1505dcd589f8SShri Abhyankar 1506a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1507dcd589f8SShri Abhyankar 150867877ebaSShri Abhyankar /* analysis phase */ 150967877ebaSShri Abhyankar /*----------------*/ 1510a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1511a5e57a09SHong Zhang mumps->id.n = M; 1512a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 151367877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1514a5e57a09SHong Zhang if (!mumps->myid) { 1515a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1516a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1517940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 151867877ebaSShri Abhyankar } 151967877ebaSShri Abhyankar } 152067877ebaSShri Abhyankar break; 152167877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1522a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1523a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1524a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1525940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 152667877ebaSShri Abhyankar } 152767877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1528a5e57a09SHong Zhang if (!mumps->myid) { 1529a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 153067877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 153167877ebaSShri Abhyankar } else { 1532a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 153367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 153467877ebaSShri Abhyankar } 15352a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1536a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 15376bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 15386bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 153967877ebaSShri Abhyankar break; 154067877ebaSShri Abhyankar } 1541a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1542a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 154367877ebaSShri Abhyankar 15442792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1545dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 154651d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 15474e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 15484e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 15490298fd71SBarry Smith F->ops->getinertia = NULL; 15504e34a73bSHong Zhang #else 15514e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1552db4efbfdSBarry Smith #endif 1553b24902e0SBarry Smith PetscFunctionReturn(0); 1554b24902e0SBarry Smith } 1555b24902e0SBarry Smith 1556397b6df1SKris Buschelman #undef __FUNCT__ 155764e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 155864e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 155974ed9c26SBarry Smith { 1560f6c57405SHong Zhang PetscErrorCode ierr; 156164e6c443SBarry Smith PetscBool iascii; 156264e6c443SBarry Smith PetscViewerFormat format; 1563a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1564f6c57405SHong Zhang 1565f6c57405SHong Zhang PetscFunctionBegin; 156664e6c443SBarry Smith /* check if matrix is mumps type */ 156764e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 156864e6c443SBarry Smith 1569251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 157064e6c443SBarry Smith if (iascii) { 157164e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 157264e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 157364e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1574a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1575a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1576a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1577a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1578a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1579a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1580a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1581a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1582a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1583a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1584a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1585a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1586a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1587a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1588a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1589a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1590a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1591a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1592a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1593f6c57405SHong Zhang } 1594a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1595a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1596a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1597f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1598a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1599a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1600a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1601ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (solution struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1602a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1603a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1604c0165424SHong Zhang 1605a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1606a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1607a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1608a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1609a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1610a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr); 161142179a6aSHong Zhang 1612a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1613a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1614a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1615f6c57405SHong Zhang 1616a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1617a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1618ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absolute pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1619ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (value of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1620a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1621f6c57405SHong Zhang 1622f6c57405SHong Zhang /* infomation local to each processor */ 162334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 1624*1575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(viewer);CHKERRQ(ierr); 1625a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 162634ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 162734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1628a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 162934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 163034ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1631a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 163234ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1633f6c57405SHong Zhang 163434ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1635a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 163634ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1637f6c57405SHong Zhang 163834ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1639a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 164034ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1641f6c57405SHong Zhang 164234ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1643a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 164434ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1645b34f08ffSHong Zhang 1646b34f08ffSHong Zhang if (mumps->ninfo && mumps->ninfo <= 40){ 1647b34f08ffSHong Zhang PetscInt i; 1648b34f08ffSHong Zhang for (i=0; i<mumps->ninfo; i++){ 1649b34f08ffSHong Zhang ierr = PetscViewerASCIIPrintf(viewer, " INFO(%d): \n",mumps->info[i]);CHKERRQ(ierr); 1650b34f08ffSHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(mumps->info[i]));CHKERRQ(ierr); 1651b34f08ffSHong Zhang ierr = PetscViewerFlush(viewer); 1652b34f08ffSHong Zhang } 1653b34f08ffSHong Zhang } 1654b34f08ffSHong Zhang 1655b34f08ffSHong Zhang 1656*1575c14dSBarry Smith ierr = PetscViewerASCIIPopSynchronized(viewer);CHKERRQ(ierr); 1657f6c57405SHong Zhang 1658a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1659a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1660a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1661a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1662a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1663f6c57405SHong Zhang 1664a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1665a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1666a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1667a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1668a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1669a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1670a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1671a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1672a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1673a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1674a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1675a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1676a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1677a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1678a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1679a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1680a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1681a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1682a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1683a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1684a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1685a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1686a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 168740d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 168840d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 168940d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(30, 31) (after solution: size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 169040d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 169140d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 169240d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1693f6c57405SHong Zhang } 1694f6c57405SHong Zhang } 1695cb828f0fSHong Zhang } 1696f6c57405SHong Zhang PetscFunctionReturn(0); 1697f6c57405SHong Zhang } 1698f6c57405SHong Zhang 169935bd34faSBarry Smith #undef __FUNCT__ 170035bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 170135bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 170235bd34faSBarry Smith { 1703cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 170435bd34faSBarry Smith 170535bd34faSBarry Smith PetscFunctionBegin; 170635bd34faSBarry Smith info->block_size = 1.0; 1707cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1708cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 170935bd34faSBarry Smith info->nz_unneeded = 0.0; 171035bd34faSBarry Smith info->assemblies = 0.0; 171135bd34faSBarry Smith info->mallocs = 0.0; 171235bd34faSBarry Smith info->memory = 0.0; 171335bd34faSBarry Smith info->fill_ratio_given = 0; 171435bd34faSBarry Smith info->fill_ratio_needed = 0; 171535bd34faSBarry Smith info->factor_mallocs = 0; 171635bd34faSBarry Smith PetscFunctionReturn(0); 171735bd34faSBarry Smith } 171835bd34faSBarry Smith 17195ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 17205ccb76cbSHong Zhang #undef __FUNCT__ 17216444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices_MUMPS" 17226444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices_MUMPS(Mat F,PetscInt size,PetscInt idxs[]) 17236444a565SStefano Zampini { 17246444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17256444a565SStefano Zampini PetscErrorCode ierr; 17266444a565SStefano Zampini 17276444a565SStefano Zampini PetscFunctionBegin; 172859ac8732SStefano Zampini if (mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MUMPS parallel Schur complements not yet supported from PETSc\n"); 17296444a565SStefano Zampini if (mumps->id.size_schur != size) { 17306444a565SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 17316444a565SStefano Zampini mumps->id.size_schur = size; 17326444a565SStefano Zampini mumps->id.schur_lld = size; 17336444a565SStefano Zampini ierr = PetscMalloc2(size,&mumps->id.listvar_schur,size*size,&mumps->id.schur);CHKERRQ(ierr); 17346444a565SStefano Zampini } 17356444a565SStefano Zampini ierr = PetscMemcpy(mumps->id.listvar_schur,idxs,size*sizeof(PetscInt));CHKERRQ(ierr); 17366444a565SStefano Zampini if (F->factortype == MAT_FACTOR_LU) { 173759ac8732SStefano Zampini mumps->id.ICNTL(19) = 3; /* MUMPS returns full matrix */ 17386444a565SStefano Zampini } else { 173959ac8732SStefano Zampini mumps->id.ICNTL(19) = 2; /* MUMPS returns lower triangular part */ 17406444a565SStefano Zampini } 174159ac8732SStefano Zampini /* set a special value of ICNTL (not handled my MUMPS) to be used in the solve phase by PETSc */ 1742b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 17436444a565SStefano Zampini PetscFunctionReturn(0); 17446444a565SStefano Zampini } 17456444a565SStefano Zampini 17466444a565SStefano Zampini #undef __FUNCT__ 17476444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices" 17486444a565SStefano Zampini /*@ 17496444a565SStefano Zampini MatMumpsSetSchurIndices - Set indices defining the Schur complement that MUMPS will compute during the factorization steps 17506444a565SStefano Zampini 17516444a565SStefano Zampini Logically Collective on Mat 17526444a565SStefano Zampini 17536444a565SStefano Zampini Input Parameters: 17546444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 17556444a565SStefano Zampini . size - size of the Schur complement indices 17566444a565SStefano Zampini - idxs[] - array of Schur complement indices 17576444a565SStefano Zampini 17586444a565SStefano Zampini Notes: 175959ac8732SStefano Zampini The user has to free the array idxs[] since the indices are copied by the routine. 176059ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 17616444a565SStefano Zampini 17626444a565SStefano Zampini Level: advanced 17636444a565SStefano Zampini 17646444a565SStefano Zampini References: MUMPS Users' Guide 17656444a565SStefano Zampini 176659ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsCreateSchurComplement(), MatMumpsGetSchurComplement() 17676444a565SStefano Zampini @*/ 17686444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices(Mat F,PetscInt size,PetscInt idxs[]) 17696444a565SStefano Zampini { 17706444a565SStefano Zampini PetscErrorCode ierr; 17716444a565SStefano Zampini 17726444a565SStefano Zampini PetscFunctionBegin; 1773e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 1774e807eca7SStefano Zampini if (size) PetscValidIntPointer(idxs,3); 17756444a565SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsSetSchurIndices_C",(Mat,PetscInt,PetscInt[]),(F,size,idxs));CHKERRQ(ierr); 17766444a565SStefano Zampini PetscFunctionReturn(0); 17776444a565SStefano Zampini } 177859ac8732SStefano Zampini 17796444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 17806444a565SStefano Zampini #undef __FUNCT__ 178159ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement_MUMPS" 178259ac8732SStefano Zampini PetscErrorCode MatMumpsCreateSchurComplement_MUMPS(Mat F,Mat* S) 17836444a565SStefano Zampini { 17846444a565SStefano Zampini Mat St; 17856444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17866444a565SStefano Zampini PetscScalar *array; 17876444a565SStefano Zampini #if defined(PETSC_USE_COMPLEX) 17888ac429a0SStefano Zampini PetscScalar im = PetscSqrtScalar((PetscScalar)-1.0); 17896444a565SStefano Zampini #endif 17906444a565SStefano Zampini PetscErrorCode ierr; 17916444a565SStefano Zampini 17926444a565SStefano Zampini PetscFunctionBegin; 179359ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 179459ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 179559ac8732SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 179659ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 179759ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 179859ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 179959ac8732SStefano Zampini } else if (!mumps->schur_restored) { 180059ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 18016444a565SStefano Zampini } 18026444a565SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)F),&St);CHKERRQ(ierr); 18036444a565SStefano Zampini ierr = MatSetSizes(St,PETSC_DECIDE,PETSC_DECIDE,mumps->id.size_schur,mumps->id.size_schur);CHKERRQ(ierr); 18046444a565SStefano Zampini ierr = MatSetType(St,MATDENSE);CHKERRQ(ierr); 18056444a565SStefano Zampini ierr = MatSetUp(St);CHKERRQ(ierr); 18066444a565SStefano Zampini ierr = MatDenseGetArray(St,&array);CHKERRQ(ierr); 180759ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full matrix */ 18086444a565SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 18096444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18106444a565SStefano Zampini for (i=0;i<N;i++) { 18116444a565SStefano Zampini for (j=0;j<N;j++) { 18126444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18136444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18146444a565SStefano Zampini #else 18156444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18166444a565SStefano Zampini #endif 18176444a565SStefano Zampini array[j*N+i] = val; 18186444a565SStefano Zampini } 18196444a565SStefano Zampini } 18206444a565SStefano Zampini } else { /* stored by columns */ 18216444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18226444a565SStefano Zampini } 18236444a565SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 18246444a565SStefano Zampini if (mumps->id.ICNTL(19) == 2) { /* lower triangular stored by columns */ 18256444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18266444a565SStefano Zampini for (i=0;i<N;i++) { 18276444a565SStefano Zampini for (j=i;j<N;j++) { 18286444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18296444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18306444a565SStefano Zampini #else 18316444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18326444a565SStefano Zampini #endif 18336444a565SStefano Zampini array[i*N+j] = val; 18346444a565SStefano Zampini array[j*N+i] = val; 18356444a565SStefano Zampini } 18366444a565SStefano Zampini } 18376444a565SStefano Zampini } else if (mumps->id.ICNTL(19) == 3) { /* full matrix */ 18386444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18396444a565SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 18406444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18416444a565SStefano Zampini for (i=0;i<N;i++) { 18426444a565SStefano Zampini for (j=0;j<i+1;j++) { 18436444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18446444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18456444a565SStefano Zampini #else 18466444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18476444a565SStefano Zampini #endif 18486444a565SStefano Zampini array[i*N+j] = val; 18496444a565SStefano Zampini array[j*N+i] = val; 18506444a565SStefano Zampini } 18516444a565SStefano Zampini } 18526444a565SStefano Zampini } 18536444a565SStefano Zampini } 18546444a565SStefano Zampini ierr = MatDenseRestoreArray(St,&array);CHKERRQ(ierr); 18556444a565SStefano Zampini *S = St; 18566444a565SStefano Zampini PetscFunctionReturn(0); 18576444a565SStefano Zampini } 18586444a565SStefano Zampini 18596444a565SStefano Zampini #undef __FUNCT__ 186059ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement" 18616444a565SStefano Zampini /*@ 186259ac8732SStefano Zampini MatMumpsCreateSchurComplement - Create a Schur complement matrix object using Schur data computed by MUMPS during the factorization step 18636444a565SStefano Zampini 18646444a565SStefano Zampini Logically Collective on Mat 18656444a565SStefano Zampini 18666444a565SStefano Zampini Input Parameters: 18676444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 18686444a565SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 18696444a565SStefano Zampini 18706444a565SStefano Zampini Notes: 187159ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 187259ac8732SStefano Zampini The routine provides a copy of the Schur data stored within MUMPS data strutures. The caller must destroy the object when it is no longer needed. 1873066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 18746444a565SStefano Zampini 18756444a565SStefano Zampini Level: advanced 18766444a565SStefano Zampini 18776444a565SStefano Zampini References: MUMPS Users' Guide 18786444a565SStefano Zampini 187959ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement() 188059ac8732SStefano Zampini @*/ 188159ac8732SStefano Zampini PetscErrorCode MatMumpsCreateSchurComplement(Mat F,Mat* S) 188259ac8732SStefano Zampini { 188359ac8732SStefano Zampini PetscErrorCode ierr; 188459ac8732SStefano Zampini 188559ac8732SStefano Zampini PetscFunctionBegin; 1886e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 188759ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsCreateSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 188859ac8732SStefano Zampini PetscFunctionReturn(0); 188959ac8732SStefano Zampini } 189059ac8732SStefano Zampini 189159ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 189259ac8732SStefano Zampini #undef __FUNCT__ 189359ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement_MUMPS" 189459ac8732SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement_MUMPS(Mat F,Mat* S) 189559ac8732SStefano Zampini { 189659ac8732SStefano Zampini Mat St; 189759ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 189859ac8732SStefano Zampini PetscErrorCode ierr; 189959ac8732SStefano Zampini 190059ac8732SStefano Zampini PetscFunctionBegin; 190159ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 190259ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 190359ac8732SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 190459ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 190559ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 190659ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 190759ac8732SStefano Zampini } else if (!mumps->schur_restored) { 190859ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 190959ac8732SStefano Zampini } 191059ac8732SStefano Zampini /* It should be the responsibility of the user to handle different ICNTL(19) cases if they want to work with the raw data */ 191159ac8732SStefano Zampini /* should I also add errors when the Schur complement has been already factored? */ 191259ac8732SStefano Zampini ierr = MatCreateSeqDense(PetscObjectComm((PetscObject)F),mumps->id.size_schur,mumps->id.size_schur,(PetscScalar*)mumps->id.schur,&St);CHKERRQ(ierr); 191359ac8732SStefano Zampini *S = St; 191459ac8732SStefano Zampini mumps->schur_restored = PETSC_FALSE; 191559ac8732SStefano Zampini PetscFunctionReturn(0); 191659ac8732SStefano Zampini } 191759ac8732SStefano Zampini 191859ac8732SStefano Zampini #undef __FUNCT__ 191959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement" 192059ac8732SStefano Zampini /*@ 192159ac8732SStefano Zampini MatMumpsGetSchurComplement - Get a Schur complement matrix object using the current status of the raw Schur data computed by MUMPS during the factorization step 192259ac8732SStefano Zampini 192359ac8732SStefano Zampini Logically Collective on Mat 192459ac8732SStefano Zampini 192559ac8732SStefano Zampini Input Parameters: 192659ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 192759ac8732SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 192859ac8732SStefano Zampini 192959ac8732SStefano Zampini Notes: 193059ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 193159ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. The caller should call MatMumpsRestoreSchurComplement when the object is no longer needed. 1932066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 193359ac8732SStefano Zampini 193459ac8732SStefano Zampini Level: advanced 193559ac8732SStefano Zampini 193659ac8732SStefano Zampini References: MUMPS Users' Guide 193759ac8732SStefano Zampini 193859ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsRestoreSchurComplement(), MatMumpsCreateSchurComplement() 19396444a565SStefano Zampini @*/ 19406444a565SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement(Mat F,Mat* S) 19416444a565SStefano Zampini { 19426444a565SStefano Zampini PetscErrorCode ierr; 19436444a565SStefano Zampini 19446444a565SStefano Zampini PetscFunctionBegin; 1945e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 194659ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsGetSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 194759ac8732SStefano Zampini PetscFunctionReturn(0); 194859ac8732SStefano Zampini } 194959ac8732SStefano Zampini 195059ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 195159ac8732SStefano Zampini #undef __FUNCT__ 195259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement_MUMPS" 195359ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement_MUMPS(Mat F,Mat* S) 195459ac8732SStefano Zampini { 195559ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 195659ac8732SStefano Zampini PetscErrorCode ierr; 195759ac8732SStefano Zampini 195859ac8732SStefano Zampini PetscFunctionBegin; 195959ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 196059ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 196159ac8732SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 196259ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 196359ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 196459ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 1965066565c5SStefano Zampini } else if (mumps->schur_restored) { 1966066565c5SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has been already restored"); 196759ac8732SStefano Zampini } 196859ac8732SStefano Zampini ierr = MatDestroy(S);CHKERRQ(ierr); 196959ac8732SStefano Zampini *S = NULL; 197059ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 197159ac8732SStefano Zampini PetscFunctionReturn(0); 197259ac8732SStefano Zampini } 197359ac8732SStefano Zampini 197459ac8732SStefano Zampini #undef __FUNCT__ 197559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement" 197659ac8732SStefano Zampini /*@ 197759ac8732SStefano Zampini MatMumpsRestoreSchurComplement - Restore the Schur complement matrix object obtained from a call to MatGetSchurComplement 197859ac8732SStefano Zampini 197959ac8732SStefano Zampini Logically Collective on Mat 198059ac8732SStefano Zampini 198159ac8732SStefano Zampini Input Parameters: 198259ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 198359ac8732SStefano Zampini . *S - location where the Schur complement is stored 198459ac8732SStefano Zampini 198559ac8732SStefano Zampini Notes: 198659ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 198759ac8732SStefano Zampini 198859ac8732SStefano Zampini Level: advanced 198959ac8732SStefano Zampini 199059ac8732SStefano Zampini References: MUMPS Users' Guide 199159ac8732SStefano Zampini 199259ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement(), MatMumpsCreateSchurComplement() 199359ac8732SStefano Zampini @*/ 199459ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement(Mat F,Mat* S) 199559ac8732SStefano Zampini { 199659ac8732SStefano Zampini PetscErrorCode ierr; 199759ac8732SStefano Zampini 199859ac8732SStefano Zampini PetscFunctionBegin; 1999e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 200059ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsRestoreSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 200159ac8732SStefano Zampini PetscFunctionReturn(0); 200259ac8732SStefano Zampini } 200359ac8732SStefano Zampini 200459ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 200559ac8732SStefano Zampini #undef __FUNCT__ 200659ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement_MUMPS" 200759ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement_MUMPS(Mat F) 200859ac8732SStefano Zampini { 200959ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 201059ac8732SStefano Zampini PetscErrorCode ierr; 201159ac8732SStefano Zampini 201259ac8732SStefano Zampini PetscFunctionBegin; 201359ac8732SStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing */ 201459ac8732SStefano Zampini PetscFunctionReturn(0); 201559ac8732SStefano Zampini } 201659ac8732SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 201759ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 201859ac8732SStefano Zampini } else if (!mumps->id.size_schur) { 201959ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 202059ac8732SStefano Zampini } else if (!mumps->schur_restored) { 202159ac8732SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 202259ac8732SStefano Zampini } 202359ac8732SStefano Zampini ierr = MatMumpsInvertSchur_Private(mumps);CHKERRQ(ierr); 202459ac8732SStefano Zampini PetscFunctionReturn(0); 202559ac8732SStefano Zampini } 202659ac8732SStefano Zampini 202759ac8732SStefano Zampini #undef __FUNCT__ 202859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement" 202959ac8732SStefano Zampini /*@ 203059ac8732SStefano Zampini MatMumpsInvertSchurComplement - Invert the raw Schur data computed by MUMPS during the factorization step 203159ac8732SStefano Zampini 203259ac8732SStefano Zampini Logically Collective on Mat 203359ac8732SStefano Zampini 203459ac8732SStefano Zampini Input Parameters: 203559ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 203659ac8732SStefano Zampini 203759ac8732SStefano Zampini Notes: 203859ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 203959ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. 204059ac8732SStefano Zampini 204159ac8732SStefano Zampini Level: advanced 204259ac8732SStefano Zampini 204359ac8732SStefano Zampini References: MUMPS Users' Guide 204459ac8732SStefano Zampini 204559ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 204659ac8732SStefano Zampini @*/ 204759ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement(Mat F) 204859ac8732SStefano Zampini { 204959ac8732SStefano Zampini PetscErrorCode ierr; 205059ac8732SStefano Zampini 205159ac8732SStefano Zampini PetscFunctionBegin; 2052e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 205359ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsInvertSchurComplement_C",(Mat),(F));CHKERRQ(ierr); 20546444a565SStefano Zampini PetscFunctionReturn(0); 20556444a565SStefano Zampini } 20566444a565SStefano Zampini 20576444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 20586444a565SStefano Zampini #undef __FUNCT__ 2059e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement_MUMPS" 2060e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement_MUMPS(Mat F, Vec rhs, Vec sol) 2061e807eca7SStefano Zampini { 2062e807eca7SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2063e807eca7SStefano Zampini MumpsScalar *orhs; 2064e807eca7SStefano Zampini PetscScalar *osol,*nrhs,*nsol; 20659a3a5937SStefano Zampini PetscInt orhs_size,osol_size,olrhs_size; 2066e807eca7SStefano Zampini PetscErrorCode ierr; 2067e807eca7SStefano Zampini 2068e807eca7SStefano Zampini PetscFunctionBegin; 2069e807eca7SStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 2070e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 2071e807eca7SStefano Zampini } else if (!mumps->id.ICNTL(19)) { 2072e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 2073e807eca7SStefano Zampini } else if (!mumps->id.size_schur) { 2074e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 2075e807eca7SStefano Zampini } else if (!mumps->schur_restored) { 2076e807eca7SStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 2077e807eca7SStefano Zampini } 2078e807eca7SStefano Zampini /* swap pointers */ 2079e807eca7SStefano Zampini orhs = mumps->id.redrhs; 20809a3a5937SStefano Zampini olrhs_size = mumps->id.lredrhs; 2081a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 2082e807eca7SStefano Zampini osol = mumps->schur_sol; 2083a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 2084e807eca7SStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 2085e807eca7SStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 2086e807eca7SStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2087a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 20889a3a5937SStefano Zampini mumps->id.lredrhs = mumps->sizeredrhs; 2089e807eca7SStefano Zampini mumps->schur_sol = nsol; 2090a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 2091a12f35bfSStefano Zampini 2092e807eca7SStefano Zampini /* solve Schur complement */ 2093e807eca7SStefano Zampini mumps->id.nrhs = 1; 2094e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 2095e807eca7SStefano Zampini /* restore pointers */ 2096e807eca7SStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 2097e807eca7SStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 2098e807eca7SStefano Zampini mumps->id.redrhs = orhs; 20999a3a5937SStefano Zampini mumps->id.lredrhs = olrhs_size; 2100a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 2101e807eca7SStefano Zampini mumps->schur_sol = osol; 2102a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 2103e807eca7SStefano Zampini PetscFunctionReturn(0); 2104e807eca7SStefano Zampini } 2105e807eca7SStefano Zampini 2106e807eca7SStefano Zampini #undef __FUNCT__ 2107e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement" 2108e807eca7SStefano Zampini /*@ 2109e807eca7SStefano Zampini MatMumpsSolveSchurComplement - Solve the Schur complement system computed by MUMPS during the factorization step 2110e807eca7SStefano Zampini 2111e807eca7SStefano Zampini Logically Collective on Mat 2112e807eca7SStefano Zampini 2113e807eca7SStefano Zampini Input Parameters: 2114e807eca7SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2115e807eca7SStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 2116e807eca7SStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 2117e807eca7SStefano Zampini 2118e807eca7SStefano Zampini Notes: 2119e807eca7SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 2120e807eca7SStefano Zampini The sizes of the vectors should match the size of the Schur complement 2121e807eca7SStefano Zampini 2122e807eca7SStefano Zampini Level: advanced 2123e807eca7SStefano Zampini 2124e807eca7SStefano Zampini References: MUMPS Users' Guide 2125e807eca7SStefano Zampini 2126e807eca7SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 2127e807eca7SStefano Zampini @*/ 2128e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement(Mat F, Vec rhs, Vec sol) 2129e807eca7SStefano Zampini { 2130e807eca7SStefano Zampini PetscErrorCode ierr; 2131e807eca7SStefano Zampini 2132e807eca7SStefano Zampini PetscFunctionBegin; 2133e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 2134e807eca7SStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 2135e807eca7SStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 2136e807eca7SStefano Zampini PetscCheckSameComm(F,1,rhs,2); 2137e807eca7SStefano Zampini PetscCheckSameComm(F,1,sol,3); 21387404bcfbSStefano Zampini ierr = PetscUseMethod(F,"MatMumpsSolveSchurComplement_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 21397404bcfbSStefano Zampini PetscFunctionReturn(0); 21407404bcfbSStefano Zampini } 21417404bcfbSStefano Zampini 21427404bcfbSStefano Zampini /* -------------------------------------------------------------------------------------------*/ 21437404bcfbSStefano Zampini #undef __FUNCT__ 21447404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose_MUMPS" 21457404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose_MUMPS(Mat F, Vec rhs, Vec sol) 21467404bcfbSStefano Zampini { 21477404bcfbSStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 21487404bcfbSStefano Zampini MumpsScalar *orhs; 21497404bcfbSStefano Zampini PetscScalar *osol,*nrhs,*nsol; 2150a12f35bfSStefano Zampini PetscInt orhs_size,osol_size; 21517404bcfbSStefano Zampini PetscErrorCode ierr; 21527404bcfbSStefano Zampini 21537404bcfbSStefano Zampini PetscFunctionBegin; 21547404bcfbSStefano Zampini if (!mumps->CleanUpMUMPS) { /* CleanUpMUMPS is set to true after numerical factorization */ 21557404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Numerical factorization phase not yet performed! You should call MatFactorSymbolic/Numeric before"); 21567404bcfbSStefano Zampini } else if (!mumps->id.ICNTL(19)) { 21577404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 21587404bcfbSStefano Zampini } else if (!mumps->id.size_schur) { 21597404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 21607404bcfbSStefano Zampini } else if (!mumps->schur_restored) { 21617404bcfbSStefano Zampini SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 21627404bcfbSStefano Zampini } 21637404bcfbSStefano Zampini /* swap pointers */ 21647404bcfbSStefano Zampini orhs = mumps->id.redrhs; 2165a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 21667404bcfbSStefano Zampini osol = mumps->schur_sol; 2167a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 21687404bcfbSStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 21697404bcfbSStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 21707404bcfbSStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2171a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 21727404bcfbSStefano Zampini mumps->schur_sol = nsol; 2173a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 2174a12f35bfSStefano Zampini 21757404bcfbSStefano Zampini /* solve Schur complement */ 21767404bcfbSStefano Zampini mumps->id.nrhs = 1; 21777404bcfbSStefano Zampini mumps->id.ICNTL(9) = 0; 21787404bcfbSStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 21797404bcfbSStefano Zampini mumps->id.ICNTL(9) = 1; 21807404bcfbSStefano Zampini /* restore pointers */ 21817404bcfbSStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 21827404bcfbSStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 21837404bcfbSStefano Zampini mumps->id.redrhs = orhs; 2184a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 21857404bcfbSStefano Zampini mumps->schur_sol = osol; 2186a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 21877404bcfbSStefano Zampini PetscFunctionReturn(0); 21887404bcfbSStefano Zampini } 21897404bcfbSStefano Zampini 21907404bcfbSStefano Zampini #undef __FUNCT__ 21917404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose" 21927404bcfbSStefano Zampini /*@ 21937404bcfbSStefano Zampini MatMumpsSolveSchurComplementTranspose - Solve the transpose of the Schur complement system computed by MUMPS during the factorization step 21947404bcfbSStefano Zampini 21957404bcfbSStefano Zampini Logically Collective on Mat 21967404bcfbSStefano Zampini 21977404bcfbSStefano Zampini Input Parameters: 21987404bcfbSStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 21997404bcfbSStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 22007404bcfbSStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 22017404bcfbSStefano Zampini 22027404bcfbSStefano Zampini Notes: 22037404bcfbSStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 22047404bcfbSStefano Zampini The sizes of the vectors should match the size of the Schur complement 22057404bcfbSStefano Zampini 22067404bcfbSStefano Zampini Level: advanced 22077404bcfbSStefano Zampini 22087404bcfbSStefano Zampini References: MUMPS Users' Guide 22097404bcfbSStefano Zampini 22107404bcfbSStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 22117404bcfbSStefano Zampini @*/ 22127404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose(Mat F, Vec rhs, Vec sol) 22137404bcfbSStefano Zampini { 22147404bcfbSStefano Zampini PetscErrorCode ierr; 22157404bcfbSStefano Zampini 22167404bcfbSStefano Zampini PetscFunctionBegin; 22177404bcfbSStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 22187404bcfbSStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 22197404bcfbSStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 22207404bcfbSStefano Zampini PetscCheckSameComm(F,1,rhs,2); 22217404bcfbSStefano Zampini PetscCheckSameComm(F,1,sol,3); 22227404bcfbSStefano Zampini ierr = PetscUseMethod(F,"MatMumpsSolveSchurComplementTranspose_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 2223e807eca7SStefano Zampini PetscFunctionReturn(0); 2224e807eca7SStefano Zampini } 2225e807eca7SStefano Zampini 2226e807eca7SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 2227e807eca7SStefano Zampini #undef __FUNCT__ 22285ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 22295ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 22305ccb76cbSHong Zhang { 2231a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 22325ccb76cbSHong Zhang 22335ccb76cbSHong Zhang PetscFunctionBegin; 2234a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 22355ccb76cbSHong Zhang PetscFunctionReturn(0); 22365ccb76cbSHong Zhang } 22375ccb76cbSHong Zhang 22385ccb76cbSHong Zhang #undef __FUNCT__ 2239bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 2240bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 2241bc6112feSHong Zhang { 2242bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2243bc6112feSHong Zhang 2244bc6112feSHong Zhang PetscFunctionBegin; 2245bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 2246bc6112feSHong Zhang PetscFunctionReturn(0); 2247bc6112feSHong Zhang } 2248bc6112feSHong Zhang 2249bc6112feSHong Zhang #undef __FUNCT__ 22505ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 22515ccb76cbSHong Zhang /*@ 22525ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 22535ccb76cbSHong Zhang 22545ccb76cbSHong Zhang Logically Collective on Mat 22555ccb76cbSHong Zhang 22565ccb76cbSHong Zhang Input Parameters: 22575ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 22585ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 22595ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 22605ccb76cbSHong Zhang 22615ccb76cbSHong Zhang Options Database: 22625ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 22635ccb76cbSHong Zhang 22645ccb76cbSHong Zhang Level: beginner 22655ccb76cbSHong Zhang 22665ccb76cbSHong Zhang References: MUMPS Users' Guide 22675ccb76cbSHong Zhang 22685ccb76cbSHong Zhang .seealso: MatGetFactor() 22695ccb76cbSHong Zhang @*/ 22705ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 22715ccb76cbSHong Zhang { 22725ccb76cbSHong Zhang PetscErrorCode ierr; 22735ccb76cbSHong Zhang 22745ccb76cbSHong Zhang PetscFunctionBegin; 22755ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 22765ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 22775ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 22785ccb76cbSHong Zhang PetscFunctionReturn(0); 22795ccb76cbSHong Zhang } 22805ccb76cbSHong Zhang 2281bc6112feSHong Zhang #undef __FUNCT__ 2282bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 2283a21f80fcSHong Zhang /*@ 2284a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS parameter ICNTL() 2285a21f80fcSHong Zhang 2286a21f80fcSHong Zhang Logically Collective on Mat 2287a21f80fcSHong Zhang 2288a21f80fcSHong Zhang Input Parameters: 2289a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2290a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 2291a21f80fcSHong Zhang 2292a21f80fcSHong Zhang Output Parameter: 2293a21f80fcSHong Zhang . ival - value of MUMPS ICNTL(icntl) 2294a21f80fcSHong Zhang 2295a21f80fcSHong Zhang Level: beginner 2296a21f80fcSHong Zhang 2297a21f80fcSHong Zhang References: MUMPS Users' Guide 2298a21f80fcSHong Zhang 2299a21f80fcSHong Zhang .seealso: MatGetFactor() 2300a21f80fcSHong Zhang @*/ 2301bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 2302bc6112feSHong Zhang { 2303bc6112feSHong Zhang PetscErrorCode ierr; 2304bc6112feSHong Zhang 2305bc6112feSHong Zhang PetscFunctionBegin; 2306bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2307bc6112feSHong Zhang PetscValidIntPointer(ival,3); 2308bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2309bc6112feSHong Zhang PetscFunctionReturn(0); 2310bc6112feSHong Zhang } 2311bc6112feSHong Zhang 23128928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 23138928b65cSHong Zhang #undef __FUNCT__ 23148928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 23158928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 23168928b65cSHong Zhang { 23178928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 23188928b65cSHong Zhang 23198928b65cSHong Zhang PetscFunctionBegin; 23208928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 23218928b65cSHong Zhang PetscFunctionReturn(0); 23228928b65cSHong Zhang } 23238928b65cSHong Zhang 23248928b65cSHong Zhang #undef __FUNCT__ 2325bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl_MUMPS" 2326bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 2327bc6112feSHong Zhang { 2328bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2329bc6112feSHong Zhang 2330bc6112feSHong Zhang PetscFunctionBegin; 2331bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 2332bc6112feSHong Zhang PetscFunctionReturn(0); 2333bc6112feSHong Zhang } 2334bc6112feSHong Zhang 2335bc6112feSHong Zhang #undef __FUNCT__ 23368928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 23378928b65cSHong Zhang /*@ 23388928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 23398928b65cSHong Zhang 23408928b65cSHong Zhang Logically Collective on Mat 23418928b65cSHong Zhang 23428928b65cSHong Zhang Input Parameters: 23438928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 23448928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 23458928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 23468928b65cSHong Zhang 23478928b65cSHong Zhang Options Database: 23488928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 23498928b65cSHong Zhang 23508928b65cSHong Zhang Level: beginner 23518928b65cSHong Zhang 23528928b65cSHong Zhang References: MUMPS Users' Guide 23538928b65cSHong Zhang 23548928b65cSHong Zhang .seealso: MatGetFactor() 23558928b65cSHong Zhang @*/ 23568928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 23578928b65cSHong Zhang { 23588928b65cSHong Zhang PetscErrorCode ierr; 23598928b65cSHong Zhang 23608928b65cSHong Zhang PetscFunctionBegin; 23618928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2362bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 23638928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 23648928b65cSHong Zhang PetscFunctionReturn(0); 23658928b65cSHong Zhang } 23668928b65cSHong Zhang 2367bc6112feSHong Zhang #undef __FUNCT__ 2368bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 2369a21f80fcSHong Zhang /*@ 2370a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 2371a21f80fcSHong Zhang 2372a21f80fcSHong Zhang Logically Collective on Mat 2373a21f80fcSHong Zhang 2374a21f80fcSHong Zhang Input Parameters: 2375a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2376a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 2377a21f80fcSHong Zhang 2378a21f80fcSHong Zhang Output Parameter: 2379a21f80fcSHong Zhang . val - value of MUMPS CNTL(icntl) 2380a21f80fcSHong Zhang 2381a21f80fcSHong Zhang Level: beginner 2382a21f80fcSHong Zhang 2383a21f80fcSHong Zhang References: MUMPS Users' Guide 2384a21f80fcSHong Zhang 2385a21f80fcSHong Zhang .seealso: MatGetFactor() 2386a21f80fcSHong Zhang @*/ 2387bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 2388bc6112feSHong Zhang { 2389bc6112feSHong Zhang PetscErrorCode ierr; 2390bc6112feSHong Zhang 2391bc6112feSHong Zhang PetscFunctionBegin; 2392bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2393bc6112feSHong Zhang PetscValidRealPointer(val,3); 2394bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2395bc6112feSHong Zhang PetscFunctionReturn(0); 2396bc6112feSHong Zhang } 2397bc6112feSHong Zhang 2398bc6112feSHong Zhang #undef __FUNCT__ 2399ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 2400ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 2401bc6112feSHong Zhang { 2402bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2403bc6112feSHong Zhang 2404bc6112feSHong Zhang PetscFunctionBegin; 2405bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 2406bc6112feSHong Zhang PetscFunctionReturn(0); 2407bc6112feSHong Zhang } 2408bc6112feSHong Zhang 2409bc6112feSHong Zhang #undef __FUNCT__ 2410ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 2411ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 2412bc6112feSHong Zhang { 2413bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2414bc6112feSHong Zhang 2415bc6112feSHong Zhang PetscFunctionBegin; 2416bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 2417bc6112feSHong Zhang PetscFunctionReturn(0); 2418bc6112feSHong Zhang } 2419bc6112feSHong Zhang 2420bc6112feSHong Zhang #undef __FUNCT__ 2421ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo_MUMPS" 2422ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 2423bc6112feSHong Zhang { 2424bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2425bc6112feSHong Zhang 2426bc6112feSHong Zhang PetscFunctionBegin; 2427bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 2428bc6112feSHong Zhang PetscFunctionReturn(0); 2429bc6112feSHong Zhang } 2430bc6112feSHong Zhang 2431bc6112feSHong Zhang #undef __FUNCT__ 2432ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 2433ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 2434bc6112feSHong Zhang { 2435bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2436bc6112feSHong Zhang 2437bc6112feSHong Zhang PetscFunctionBegin; 2438bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 2439bc6112feSHong Zhang PetscFunctionReturn(0); 2440bc6112feSHong Zhang } 2441bc6112feSHong Zhang 2442bc6112feSHong Zhang #undef __FUNCT__ 2443ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 2444a21f80fcSHong Zhang /*@ 2445a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 2446a21f80fcSHong Zhang 2447a21f80fcSHong Zhang Logically Collective on Mat 2448a21f80fcSHong Zhang 2449a21f80fcSHong Zhang Input Parameters: 2450a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2451a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 2452a21f80fcSHong Zhang 2453a21f80fcSHong Zhang Output Parameter: 2454a21f80fcSHong Zhang . ival - value of MUMPS INFO(icntl) 2455a21f80fcSHong Zhang 2456a21f80fcSHong Zhang Level: beginner 2457a21f80fcSHong Zhang 2458a21f80fcSHong Zhang References: MUMPS Users' Guide 2459a21f80fcSHong Zhang 2460a21f80fcSHong Zhang .seealso: MatGetFactor() 2461a21f80fcSHong Zhang @*/ 2462ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 2463bc6112feSHong Zhang { 2464bc6112feSHong Zhang PetscErrorCode ierr; 2465bc6112feSHong Zhang 2466bc6112feSHong Zhang PetscFunctionBegin; 2467ca810319SHong Zhang PetscValidIntPointer(ival,3); 2468ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2469bc6112feSHong Zhang PetscFunctionReturn(0); 2470bc6112feSHong Zhang } 2471bc6112feSHong Zhang 2472bc6112feSHong Zhang #undef __FUNCT__ 2473ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 2474a21f80fcSHong Zhang /*@ 2475a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 2476a21f80fcSHong Zhang 2477a21f80fcSHong Zhang Logically Collective on Mat 2478a21f80fcSHong Zhang 2479a21f80fcSHong Zhang Input Parameters: 2480a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2481a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 2482a21f80fcSHong Zhang 2483a21f80fcSHong Zhang Output Parameter: 2484a21f80fcSHong Zhang . ival - value of MUMPS INFOG(icntl) 2485a21f80fcSHong Zhang 2486a21f80fcSHong Zhang Level: beginner 2487a21f80fcSHong Zhang 2488a21f80fcSHong Zhang References: MUMPS Users' Guide 2489a21f80fcSHong Zhang 2490a21f80fcSHong Zhang .seealso: MatGetFactor() 2491a21f80fcSHong Zhang @*/ 2492ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 2493bc6112feSHong Zhang { 2494bc6112feSHong Zhang PetscErrorCode ierr; 2495bc6112feSHong Zhang 2496bc6112feSHong Zhang PetscFunctionBegin; 2497ca810319SHong Zhang PetscValidIntPointer(ival,3); 2498ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2499bc6112feSHong Zhang PetscFunctionReturn(0); 2500bc6112feSHong Zhang } 2501bc6112feSHong Zhang 2502bc6112feSHong Zhang #undef __FUNCT__ 2503ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 2504a21f80fcSHong Zhang /*@ 2505a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 2506a21f80fcSHong Zhang 2507a21f80fcSHong Zhang Logically Collective on Mat 2508a21f80fcSHong Zhang 2509a21f80fcSHong Zhang Input Parameters: 2510a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2511a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 2512a21f80fcSHong Zhang 2513a21f80fcSHong Zhang Output Parameter: 2514a21f80fcSHong Zhang . val - value of MUMPS RINFO(icntl) 2515a21f80fcSHong Zhang 2516a21f80fcSHong Zhang Level: beginner 2517a21f80fcSHong Zhang 2518a21f80fcSHong Zhang References: MUMPS Users' Guide 2519a21f80fcSHong Zhang 2520a21f80fcSHong Zhang .seealso: MatGetFactor() 2521a21f80fcSHong Zhang @*/ 2522ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 2523bc6112feSHong Zhang { 2524bc6112feSHong Zhang PetscErrorCode ierr; 2525bc6112feSHong Zhang 2526bc6112feSHong Zhang PetscFunctionBegin; 2527bc6112feSHong Zhang PetscValidRealPointer(val,3); 2528ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2529bc6112feSHong Zhang PetscFunctionReturn(0); 2530bc6112feSHong Zhang } 2531bc6112feSHong Zhang 2532bc6112feSHong Zhang #undef __FUNCT__ 2533ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 2534a21f80fcSHong Zhang /*@ 2535a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 2536a21f80fcSHong Zhang 2537a21f80fcSHong Zhang Logically Collective on Mat 2538a21f80fcSHong Zhang 2539a21f80fcSHong Zhang Input Parameters: 2540a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2541a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 2542a21f80fcSHong Zhang 2543a21f80fcSHong Zhang Output Parameter: 2544a21f80fcSHong Zhang . val - value of MUMPS RINFOG(icntl) 2545a21f80fcSHong Zhang 2546a21f80fcSHong Zhang Level: beginner 2547a21f80fcSHong Zhang 2548a21f80fcSHong Zhang References: MUMPS Users' Guide 2549a21f80fcSHong Zhang 2550a21f80fcSHong Zhang .seealso: MatGetFactor() 2551a21f80fcSHong Zhang @*/ 2552ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 2553bc6112feSHong Zhang { 2554bc6112feSHong Zhang PetscErrorCode ierr; 2555bc6112feSHong Zhang 2556bc6112feSHong Zhang PetscFunctionBegin; 2557bc6112feSHong Zhang PetscValidRealPointer(val,3); 2558ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2559bc6112feSHong Zhang PetscFunctionReturn(0); 2560bc6112feSHong Zhang } 2561bc6112feSHong Zhang 256224b6179bSKris Buschelman /*MC 25632692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 256424b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 256524b6179bSKris Buschelman 256641c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 256724b6179bSKris Buschelman 2568c2b89b5dSBarry Smith Use ./configure --download-mumps --download-scalapack --download-parmetis --download-metis --download-ptscotch to have PETSc installed with MUMPS 2569c2b89b5dSBarry Smith 2570c2b89b5dSBarry Smith Use -pc_type cholesky or lu -pc_factor_mat_solver_package mumps to us this direct solver 2571c2b89b5dSBarry Smith 257224b6179bSKris Buschelman Options Database Keys: 25734e34a73bSHong Zhang + -mat_mumps_icntl_1 <6>: ICNTL(1): output stream for error messages (None) 25744e34a73bSHong Zhang . -mat_mumps_icntl_2 <0>: ICNTL(2): output stream for diagnostic printing, statistics, and warning (None) 25754e34a73bSHong Zhang . -mat_mumps_icntl_3 <0>: ICNTL(3): output stream for global information, collected on the host (None) 25764e34a73bSHong Zhang . -mat_mumps_icntl_4 <0>: ICNTL(4): level of printing (0 to 4) (None) 25774e34a73bSHong Zhang . -mat_mumps_icntl_6 <7>: ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) (None) 25784e34a73bSHong Zhang . -mat_mumps_icntl_7 <7>: ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis (None) 25794e34a73bSHong Zhang . -mat_mumps_icntl_8 <77>: ICNTL(8): scaling strategy (-2 to 8 or 77) (None) 25804e34a73bSHong Zhang . -mat_mumps_icntl_10 <0>: ICNTL(10): max num of refinements (None) 25814e34a73bSHong Zhang . -mat_mumps_icntl_11 <0>: ICNTL(11): statistics related to an error analysis (via -ksp_view) (None) 25824e34a73bSHong Zhang . -mat_mumps_icntl_12 <1>: ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) (None) 25834e34a73bSHong Zhang . -mat_mumps_icntl_13 <0>: ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting (None) 25844e34a73bSHong Zhang . -mat_mumps_icntl_14 <20>: ICNTL(14): percentage increase in the estimated working space (None) 25854e34a73bSHong Zhang . -mat_mumps_icntl_19 <0>: ICNTL(19): computes the Schur complement (None) 25864e34a73bSHong Zhang . -mat_mumps_icntl_22 <0>: ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) (None) 25874e34a73bSHong Zhang . -mat_mumps_icntl_23 <0>: ICNTL(23): max size of the working memory (MB) that can allocate per processor (None) 25884e34a73bSHong Zhang . -mat_mumps_icntl_24 <0>: ICNTL(24): detection of null pivot rows (0 or 1) (None) 25894e34a73bSHong Zhang . -mat_mumps_icntl_25 <0>: ICNTL(25): compute a solution of a deficient matrix and a null space basis (None) 25904e34a73bSHong Zhang . -mat_mumps_icntl_26 <0>: ICNTL(26): drives the solution phase if a Schur complement matrix (None) 25914e34a73bSHong Zhang . -mat_mumps_icntl_28 <1>: ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering (None) 25924e34a73bSHong Zhang . -mat_mumps_icntl_29 <0>: ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis (None) 25934e34a73bSHong Zhang . -mat_mumps_icntl_30 <0>: ICNTL(30): compute user-specified set of entries in inv(A) (None) 25944e34a73bSHong Zhang . -mat_mumps_icntl_31 <0>: ICNTL(31): indicates which factors may be discarded during factorization (None) 25954e34a73bSHong Zhang . -mat_mumps_icntl_33 <0>: ICNTL(33): compute determinant (None) 25964e34a73bSHong Zhang . -mat_mumps_cntl_1 <0.01>: CNTL(1): relative pivoting threshold (None) 25974e34a73bSHong Zhang . -mat_mumps_cntl_2 <1.49012e-08>: CNTL(2): stopping criterion of refinement (None) 25984e34a73bSHong Zhang . -mat_mumps_cntl_3 <0>: CNTL(3): absolute pivoting threshold (None) 25994e34a73bSHong Zhang . -mat_mumps_cntl_4 <-1>: CNTL(4): value for static pivoting (None) 26004e34a73bSHong Zhang - -mat_mumps_cntl_5 <0>: CNTL(5): fixation for null pivots (None) 260124b6179bSKris Buschelman 260224b6179bSKris Buschelman Level: beginner 260324b6179bSKris Buschelman 260441c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 260541c8de11SBarry Smith 260624b6179bSKris Buschelman M*/ 260724b6179bSKris Buschelman 260835bd34faSBarry Smith #undef __FUNCT__ 260935bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 2610f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 261135bd34faSBarry Smith { 261235bd34faSBarry Smith PetscFunctionBegin; 26132692d6eeSBarry Smith *type = MATSOLVERMUMPS; 261435bd34faSBarry Smith PetscFunctionReturn(0); 261535bd34faSBarry Smith } 261635bd34faSBarry Smith 2617bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 26182877fffaSHong Zhang #undef __FUNCT__ 2619bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 26208cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 26212877fffaSHong Zhang { 26222877fffaSHong Zhang Mat B; 26232877fffaSHong Zhang PetscErrorCode ierr; 26242877fffaSHong Zhang Mat_MUMPS *mumps; 2625ace3abfcSBarry Smith PetscBool isSeqAIJ; 26262877fffaSHong Zhang 26272877fffaSHong Zhang PetscFunctionBegin; 26282877fffaSHong Zhang /* Create the factorization matrix */ 2629251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 2630ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 26312877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 26322877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2633bccb9932SShri Abhyankar if (isSeqAIJ) { 26340298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 2635bccb9932SShri Abhyankar } else { 26360298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 2637bccb9932SShri Abhyankar } 26382877fffaSHong Zhang 2639b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 26402205254eSKarl Rupp 26412877fffaSHong Zhang B->ops->view = MatView_MUMPS; 264235bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 264320be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 26442205254eSKarl Rupp 2645bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2646bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2647bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2648bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2649bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2650bc6112feSHong Zhang 2651ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2652ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2653ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2654ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 26556444a565SStefano Zampini 26566444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 265759ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 265859ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 26596444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 266059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2661e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 26627404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2663e807eca7SStefano Zampini 2664450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2665450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 2666d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 2667bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 2668bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 2669746480a1SHong Zhang mumps->sym = 0; 2670dcd589f8SShri Abhyankar } else { 267167877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2672450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 2673bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 2674bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 267559ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 267659ac8732SStefano Zampini mumps->sym = 2; 267759ac8732SStefano Zampini #else 26786fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 26796fdc2a6dSBarry Smith else mumps->sym = 2; 268059ac8732SStefano Zampini #endif 2681450b117fSShri Abhyankar } 26822877fffaSHong Zhang 26832877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 2684bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 26852877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 26862877fffaSHong Zhang B->spptr = (void*)mumps; 26872205254eSKarl Rupp 2688f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2689746480a1SHong Zhang 26902877fffaSHong Zhang *F = B; 26912877fffaSHong Zhang PetscFunctionReturn(0); 26922877fffaSHong Zhang } 26932877fffaSHong Zhang 2694bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 26952877fffaSHong Zhang #undef __FUNCT__ 2696bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 26978cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 26982877fffaSHong Zhang { 26992877fffaSHong Zhang Mat B; 27002877fffaSHong Zhang PetscErrorCode ierr; 27012877fffaSHong Zhang Mat_MUMPS *mumps; 2702ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 27032877fffaSHong Zhang 27042877fffaSHong Zhang PetscFunctionBegin; 2705ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 2706ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 2707251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 27082877fffaSHong Zhang /* Create the factorization matrix */ 2709ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 27102877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 27112877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2712b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2713bccb9932SShri Abhyankar if (isSeqSBAIJ) { 27140298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 27152205254eSKarl Rupp 271616ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 2717dcd589f8SShri Abhyankar } else { 27180298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 27192205254eSKarl Rupp 2720bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 2721bccb9932SShri Abhyankar } 2722bccb9932SShri Abhyankar 272367877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2724bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 272520be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 27262205254eSKarl Rupp 2727bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2728b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2729b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2730b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2731b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2732bc6112feSHong Zhang 2733ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2734ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2735ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2736ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 27372205254eSKarl Rupp 27386444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 273959ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 274059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27416444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 274259ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2743e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 27447404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 27456444a565SStefano Zampini 2746f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 274759ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 274859ac8732SStefano Zampini mumps->sym = 2; 274959ac8732SStefano Zampini #else 27506fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 27516fdc2a6dSBarry Smith else mumps->sym = 2; 275259ac8732SStefano Zampini #endif 2753a214ac2aSShri Abhyankar 2754bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 2755bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2756f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 27572877fffaSHong Zhang B->spptr = (void*)mumps; 27582205254eSKarl Rupp 2759f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2760746480a1SHong Zhang 27612877fffaSHong Zhang *F = B; 27622877fffaSHong Zhang PetscFunctionReturn(0); 27632877fffaSHong Zhang } 276497969023SHong Zhang 2765450b117fSShri Abhyankar #undef __FUNCT__ 2766bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 27678cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 276867877ebaSShri Abhyankar { 276967877ebaSShri Abhyankar Mat B; 277067877ebaSShri Abhyankar PetscErrorCode ierr; 277167877ebaSShri Abhyankar Mat_MUMPS *mumps; 2772ace3abfcSBarry Smith PetscBool isSeqBAIJ; 277367877ebaSShri Abhyankar 277467877ebaSShri Abhyankar PetscFunctionBegin; 277567877ebaSShri Abhyankar /* Create the factorization matrix */ 2776251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 2777ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 277867877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 277967877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2780bccb9932SShri Abhyankar if (isSeqBAIJ) { 27810298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 2782bccb9932SShri Abhyankar } else { 27830298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 2784bccb9932SShri Abhyankar } 2785450b117fSShri Abhyankar 2786b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2787450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2788450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 2789450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 2790bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 2791bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 2792746480a1SHong Zhang mumps->sym = 0; 2793f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 2794bccb9932SShri Abhyankar 2795450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 279620be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 27972205254eSKarl Rupp 2798bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2799bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2800bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2801bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2802bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2803bc6112feSHong Zhang 2804ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2805ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2806ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2807ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2808450b117fSShri Abhyankar 28096444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 281059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 281159ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 28126444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 281359ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2814e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 28157404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 28166444a565SStefano Zampini 2817450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2818bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2819450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2820450b117fSShri Abhyankar B->spptr = (void*)mumps; 28212205254eSKarl Rupp 2822f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2823746480a1SHong Zhang 2824450b117fSShri Abhyankar *F = B; 2825450b117fSShri Abhyankar PetscFunctionReturn(0); 2826450b117fSShri Abhyankar } 282742c9c57cSBarry Smith 282842c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 282942c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat,MatFactorType,Mat*); 283042c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat,MatFactorType,Mat*); 283142c9c57cSBarry Smith 283242c9c57cSBarry Smith #undef __FUNCT__ 283342c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 283429b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 283542c9c57cSBarry Smith { 283642c9c57cSBarry Smith PetscErrorCode ierr; 283742c9c57cSBarry Smith 283842c9c57cSBarry Smith PetscFunctionBegin; 283942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 284042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 284142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 284242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 284342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 284442c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 284542c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 284642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 284742c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 284842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 284942c9c57cSBarry Smith PetscFunctionReturn(0); 285042c9c57cSBarry Smith } 285142c9c57cSBarry Smith 2852