11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8b5fa320bSStefano Zampini #include <petscblaslapack.h> 9397b6df1SKris Buschelman 10397b6df1SKris Buschelman EXTERN_C_BEGIN 11397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 122907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 132907cef9SHong Zhang #include <cmumps_c.h> 142907cef9SHong Zhang #else 15c6db04a5SJed Brown #include <zmumps_c.h> 162907cef9SHong Zhang #endif 172907cef9SHong Zhang #else 182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 192907cef9SHong Zhang #include <smumps_c.h> 20397b6df1SKris Buschelman #else 21c6db04a5SJed Brown #include <dmumps_c.h> 22397b6df1SKris Buschelman #endif 232907cef9SHong Zhang #endif 24397b6df1SKris Buschelman EXTERN_C_END 25397b6df1SKris Buschelman #define JOB_INIT -1 263d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 273d472b54SHong Zhang #define JOB_FACTNUMERIC 2 283d472b54SHong Zhang #define JOB_SOLVE 3 29397b6df1SKris Buschelman #define JOB_END -2 303d472b54SHong Zhang 312907cef9SHong Zhang /* calls to MUMPS */ 322907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 332907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 342907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 352907cef9SHong Zhang #else 362907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 372907cef9SHong Zhang #endif 382907cef9SHong Zhang #else 392907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 402907cef9SHong Zhang #define PetscMUMPS_c smumps_c 412907cef9SHong Zhang #else 422907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 432907cef9SHong Zhang #endif 442907cef9SHong Zhang #endif 452907cef9SHong Zhang 46940cd9d6SSatish Balay /* declare MumpsScalar */ 47940cd9d6SSatish Balay #if defined(PETSC_USE_COMPLEX) 48940cd9d6SSatish Balay #if defined(PETSC_USE_REAL_SINGLE) 49940cd9d6SSatish Balay #define MumpsScalar mumps_complex 50940cd9d6SSatish Balay #else 51940cd9d6SSatish Balay #define MumpsScalar mumps_double_complex 52940cd9d6SSatish Balay #endif 53940cd9d6SSatish Balay #else 54940cd9d6SSatish Balay #define MumpsScalar PetscScalar 55940cd9d6SSatish Balay #endif 563d472b54SHong Zhang 57397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 58397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 59397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 60397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 61a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 62397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 63adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 64397b6df1SKris Buschelman 65397b6df1SKris Buschelman typedef struct { 66397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 672907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 682907cef9SHong Zhang CMUMPS_STRUC_C id; 692907cef9SHong Zhang #else 70397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 712907cef9SHong Zhang #endif 722907cef9SHong Zhang #else 732907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 742907cef9SHong Zhang SMUMPS_STRUC_C id; 75397b6df1SKris Buschelman #else 76397b6df1SKris Buschelman DMUMPS_STRUC_C id; 77397b6df1SKris Buschelman #endif 782907cef9SHong Zhang #endif 792907cef9SHong Zhang 80397b6df1SKris Buschelman MatStructure matstruc; 81c1490034SHong Zhang PetscMPIInt myid,size; 82a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 83397b6df1SKris Buschelman PetscScalar *val; 84397b6df1SKris Buschelman MPI_Comm comm_mumps; 85*6f3cc6f9SBarry Smith PetscBool isAIJ; 86a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 87801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 88801fbe65SHong Zhang Vec b_seq,x_seq; 89b34f08ffSHong Zhang PetscInt ninfo,*info; /* display INFO */ 90b5fa320bSStefano Zampini PetscBool schur_second_solve; 91b5fa320bSStefano Zampini PetscInt sizeredrhs; 92b5fa320bSStefano Zampini PetscInt *schur_pivots; 9359ac8732SStefano Zampini PetscInt schur_B_lwork; 94b5fa320bSStefano Zampini PetscScalar *schur_work; 9559ac8732SStefano Zampini PetscScalar *schur_sol; 9659ac8732SStefano Zampini PetscInt schur_sizesol; 9759ac8732SStefano Zampini PetscBool schur_restored; 9859ac8732SStefano Zampini PetscBool schur_factored; 9959ac8732SStefano Zampini PetscBool schur_inverted; 1002205254eSKarl Rupp 101bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 102bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 103f0c56d0fSKris Buschelman } Mat_MUMPS; 104f0c56d0fSKris Buschelman 10509573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 106b24902e0SBarry Smith 10759ac8732SStefano Zampini #undef __FUNCT__ 10859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsResetSchur_Private" 10959ac8732SStefano Zampini static PetscErrorCode MatMumpsResetSchur_Private(Mat_MUMPS* mumps) 110b5fa320bSStefano Zampini { 111b5fa320bSStefano Zampini PetscErrorCode ierr; 112b5fa320bSStefano Zampini 113b5fa320bSStefano Zampini PetscFunctionBegin; 11459ac8732SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 11559ac8732SStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 11659ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 11759ac8732SStefano Zampini ierr = PetscFree(mumps->schur_pivots);CHKERRQ(ierr); 11859ac8732SStefano Zampini ierr = PetscFree(mumps->schur_work);CHKERRQ(ierr); 11959ac8732SStefano Zampini if (!mumps->schur_restored) { 12059ac8732SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 12159ac8732SStefano Zampini } 12259ac8732SStefano Zampini mumps->id.size_schur = 0; 12359ac8732SStefano Zampini mumps->id.ICNTL(19) = 0; 12459ac8732SStefano Zampini PetscFunctionReturn(0); 12559ac8732SStefano Zampini } 12659ac8732SStefano Zampini 12759ac8732SStefano Zampini #undef __FUNCT__ 12859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsFactorSchur_Private" 12959ac8732SStefano Zampini static PetscErrorCode MatMumpsFactorSchur_Private(Mat_MUMPS* mumps) 13059ac8732SStefano Zampini { 13159ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 13259ac8732SStefano Zampini PetscErrorCode ierr; 13359ac8732SStefano Zampini 13459ac8732SStefano Zampini PetscFunctionBegin; 13559ac8732SStefano Zampini if (mumps->schur_factored) { 13659ac8732SStefano Zampini PetscFunctionReturn(0); 13759ac8732SStefano Zampini } 13859ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 13959ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 14059ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 14159ac8732SStefano Zampini if (!mumps->schur_pivots) { 14259ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 14359ac8732SStefano Zampini } 14459ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 14559ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&B_N,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&B_ierr)); 14659ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 14759ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRF Lapack routine %d",(int)B_ierr); 14859ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 14959ac8732SStefano Zampini char ord[2]; 15059ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 15159ac8732SStefano Zampini sprintf(ord,"L"); 15259ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 15359ac8732SStefano Zampini sprintf(ord,"U"); 15459ac8732SStefano Zampini } 15559ac8732SStefano Zampini if (mumps->id.sym == 2) { 15659ac8732SStefano Zampini if (!mumps->schur_pivots) { 15759ac8732SStefano Zampini PetscScalar lwork; 15859ac8732SStefano Zampini 15959ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 16059ac8732SStefano Zampini mumps->schur_B_lwork=-1; 16159ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 16359ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 16459ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYTRF Lapack routine %d",(int)B_ierr); 16559ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 16659ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 16759ac8732SStefano Zampini } 16859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 17059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRF Lapack routine %d",(int)B_ierr); 17259ac8732SStefano Zampini } else { 17359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 17459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,&B_ierr)); 17559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRF Lapack routine %d",(int)B_ierr); 17759ac8732SStefano Zampini } 17859ac8732SStefano Zampini } 17959ac8732SStefano Zampini mumps->schur_factored = PETSC_TRUE; 18059ac8732SStefano Zampini PetscFunctionReturn(0); 18159ac8732SStefano Zampini } 18259ac8732SStefano Zampini 18359ac8732SStefano Zampini #undef __FUNCT__ 18459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchur_Private" 18559ac8732SStefano Zampini static PetscErrorCode MatMumpsInvertSchur_Private(Mat_MUMPS* mumps) 18659ac8732SStefano Zampini { 18759ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 18859ac8732SStefano Zampini PetscErrorCode ierr; 18959ac8732SStefano Zampini 19059ac8732SStefano Zampini PetscFunctionBegin; 19159ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 19259ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 19359ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 19459ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 19559ac8732SStefano Zampini if (!mumps->schur_work) { 19659ac8732SStefano Zampini PetscScalar lwork; 19759ac8732SStefano Zampini 19859ac8732SStefano Zampini mumps->schur_B_lwork = -1; 19959ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 20159ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20259ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GETRI Lapack routine %d",(int)B_ierr); 20359ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 20459ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 20559ac8732SStefano Zampini } 20659ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20759ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 20859ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20959ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRI Lapack routine %d",(int)B_ierr); 21059ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 21159ac8732SStefano Zampini char ord[2]; 21259ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 21359ac8732SStefano Zampini sprintf(ord,"L"); 21459ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 21559ac8732SStefano Zampini sprintf(ord,"U"); 21659ac8732SStefano Zampini } 21759ac8732SStefano Zampini if (mumps->id.sym == 2) { 21859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&B_ierr)); 22059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRI Lapack routine %d",(int)B_ierr); 22259ac8732SStefano Zampini } else { 22359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,&B_ierr)); 22559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRI Lapack routine %d",(int)B_ierr); 22759ac8732SStefano Zampini } 22859ac8732SStefano Zampini } 22959ac8732SStefano Zampini mumps->schur_inverted = PETSC_TRUE; 23059ac8732SStefano Zampini PetscFunctionReturn(0); 23159ac8732SStefano Zampini } 23259ac8732SStefano Zampini 23359ac8732SStefano Zampini #undef __FUNCT__ 23459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchur_Private" 235e807eca7SStefano Zampini static PetscErrorCode MatMumpsSolveSchur_Private(Mat_MUMPS* mumps, PetscBool sol_in_redrhs) 23659ac8732SStefano Zampini { 23759ac8732SStefano Zampini PetscBLASInt B_N,B_Nrhs,B_ierr,B_slda,B_rlda; 23859ac8732SStefano Zampini PetscScalar one=1.,zero=0.; 23959ac8732SStefano Zampini PetscErrorCode ierr; 24059ac8732SStefano Zampini 24159ac8732SStefano Zampini PetscFunctionBegin; 24259ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 243b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 244b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 245b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.nrhs,&B_Nrhs);CHKERRQ(ierr); 246b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.lredrhs,&B_rlda);CHKERRQ(ierr); 24759ac8732SStefano Zampini if (mumps->schur_inverted) { 24859ac8732SStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 24959ac8732SStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 25059ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 25159ac8732SStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 25259ac8732SStefano Zampini mumps->schur_sizesol = sizesol; 253b5fa320bSStefano Zampini } 25459ac8732SStefano Zampini if (!mumps->sym) { 25559ac8732SStefano Zampini char type[2]; 256b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 25759ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25859ac8732SStefano Zampini sprintf(type,"N"); 259b5fa320bSStefano Zampini } else { 26059ac8732SStefano Zampini sprintf(type,"T"); 261b5fa320bSStefano Zampini } 26259ac8732SStefano Zampini } else { /* stored by columns */ 26359ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 26459ac8732SStefano Zampini sprintf(type,"T"); 26559ac8732SStefano Zampini } else { 26659ac8732SStefano Zampini sprintf(type,"N"); 26759ac8732SStefano Zampini } 26859ac8732SStefano Zampini } 26959ac8732SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_(type,"N",&B_N,&B_Nrhs,&B_N,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27059ac8732SStefano Zampini } else { 27159ac8732SStefano Zampini char ord[2]; 27259ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 27359ac8732SStefano Zampini sprintf(ord,"L"); 27459ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 27559ac8732SStefano Zampini sprintf(ord,"U"); 27659ac8732SStefano Zampini } 27759ac8732SStefano Zampini PetscStackCallBLAS("BLASsymm",BLASsymm_("L",ord,&B_N,&B_Nrhs,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27859ac8732SStefano Zampini } 279e807eca7SStefano Zampini if (sol_in_redrhs) { 28059ac8732SStefano Zampini ierr = PetscMemcpy(mumps->id.redrhs,mumps->schur_sol,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 281e807eca7SStefano Zampini } 282a12f35bfSStefano Zampini } else { /* Schur complement has not been inverted */ 283a12f35bfSStefano Zampini MumpsScalar *orhs=NULL; 284a12f35bfSStefano Zampini 285a12f35bfSStefano Zampini if (!sol_in_redrhs) { 286a12f35bfSStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 287a12f35bfSStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 288a12f35bfSStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 289a12f35bfSStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 290a12f35bfSStefano Zampini mumps->schur_sizesol = sizesol; 291a12f35bfSStefano Zampini } 292a12f35bfSStefano Zampini orhs = mumps->id.redrhs; 293a12f35bfSStefano Zampini ierr = PetscMemcpy(mumps->schur_sol,mumps->id.redrhs,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 294a12f35bfSStefano Zampini mumps->id.redrhs = (MumpsScalar*)mumps->schur_sol; 295a12f35bfSStefano Zampini } 29659ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 29759ac8732SStefano Zampini char type[2]; 29859ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 29959ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30059ac8732SStefano Zampini sprintf(type,"N"); 30159ac8732SStefano Zampini } else { 30259ac8732SStefano Zampini sprintf(type,"T"); 30359ac8732SStefano Zampini } 30459ac8732SStefano Zampini } else { /* stored by columns */ 30559ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30659ac8732SStefano Zampini sprintf(type,"T"); 30759ac8732SStefano Zampini } else { 30859ac8732SStefano Zampini sprintf(type,"N"); 30959ac8732SStefano Zampini } 31059ac8732SStefano Zampini } 31159ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 31259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_(type,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 313b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 314b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRS Lapack routine %d",(int)B_ierr); 315b5fa320bSStefano Zampini } else { /* either full or lower-triangular (not packed) */ 316b5fa320bSStefano Zampini char ord[2]; 317b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 318b5fa320bSStefano Zampini sprintf(ord,"L"); 319b5fa320bSStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 320b5fa320bSStefano Zampini sprintf(ord,"U"); 321b5fa320bSStefano Zampini } 322b5fa320bSStefano Zampini if (mumps->id.sym == 2) { 323b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 325b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 326b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRS Lapack routine %d",(int)B_ierr); 327b5fa320bSStefano Zampini } else { 328b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 330b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 331b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRS Lapack routine %d",(int)B_ierr); 332b5fa320bSStefano Zampini } 333b5fa320bSStefano Zampini } 334e807eca7SStefano Zampini if (!sol_in_redrhs) { 335a12f35bfSStefano Zampini mumps->id.redrhs = orhs; 336e807eca7SStefano Zampini } 33759ac8732SStefano Zampini } 338b5fa320bSStefano Zampini PetscFunctionReturn(0); 339b5fa320bSStefano Zampini } 340b5fa320bSStefano Zampini 34159ac8732SStefano Zampini #undef __FUNCT__ 34259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsHandleSchur_Private" 343b5fa320bSStefano Zampini static PetscErrorCode MatMumpsHandleSchur_Private(Mat_MUMPS* mumps) 344b5fa320bSStefano Zampini { 345b5fa320bSStefano Zampini PetscErrorCode ierr; 346b5fa320bSStefano Zampini 347b5fa320bSStefano Zampini PetscFunctionBegin; 348b5fa320bSStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing when Schur complement has not been computed */ 349b5fa320bSStefano Zampini PetscFunctionReturn(0); 350b5fa320bSStefano Zampini } 351b5fa320bSStefano Zampini if (!mumps->schur_second_solve) { /* prepare for the condensation step */ 352b5fa320bSStefano Zampini /* check if schur complement has been computed 353e807eca7SStefano Zampini We set by default ICNTL(26) == -1 when Schur indices have been provided by the user. 354b5fa320bSStefano Zampini According to MUMPS (5.0.0) manual, any value should be harmful during the factorization phase 355b5fa320bSStefano Zampini Unless the user provides a valid value for ICNTL(26), MatSolve and MatMatSolve routines solve the full system. 356b5fa320bSStefano Zampini This requires an extra call to PetscMUMPS_c and the computation of the factors for S, handled setting double_schur_solve to PETSC_TRUE */ 357b5fa320bSStefano Zampini if (mumps->id.ICNTL(26) < 0 || mumps->id.ICNTL(26) > 2) { 358b5fa320bSStefano Zampini PetscInt sizeredrhs = mumps->id.nrhs*mumps->id.size_schur; 359b5fa320bSStefano Zampini /* allocate MUMPS internal array to store reduced right-hand sides */ 360b5fa320bSStefano Zampini if (!mumps->id.redrhs || sizeredrhs > mumps->sizeredrhs) { 361b5fa320bSStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 362b5fa320bSStefano Zampini mumps->id.lredrhs = mumps->id.size_schur; 363b5fa320bSStefano Zampini ierr = PetscMalloc1(mumps->id.nrhs*mumps->id.lredrhs,&mumps->id.redrhs);CHKERRQ(ierr); 364b5fa320bSStefano Zampini mumps->sizeredrhs = mumps->id.nrhs*mumps->id.lredrhs; 365b5fa320bSStefano Zampini } 366b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_TRUE; 367b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 1; /* condensation phase */ 368b5fa320bSStefano Zampini } 369b5fa320bSStefano Zampini } else { /* prepare for the expansion step */ 370b5fa320bSStefano Zampini /* solve Schur complement (this should be done by the MUMPS user, so basically us) */ 371e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 372b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 2; /* expansion phase */ 373b5fa320bSStefano Zampini PetscMUMPS_c(&mumps->id); 374b5fa320bSStefano Zampini if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 375b5fa320bSStefano Zampini /* restore defaults */ 376b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 377b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 378b5fa320bSStefano Zampini } 379b5fa320bSStefano Zampini PetscFunctionReturn(0); 380b5fa320bSStefano Zampini } 381b5fa320bSStefano Zampini 382397b6df1SKris Buschelman /* 383d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], col[nz], val[nz] 384d341cd04SHong Zhang 385397b6df1SKris Buschelman input: 38667877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 387397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 388bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 389bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 390397b6df1SKris Buschelman output: 391397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 392397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 393eb9baa12SBarry Smith 394eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 395eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 396eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 397eb9baa12SBarry Smith 398397b6df1SKris Buschelman */ 39916ebf90aSShri Abhyankar 40016ebf90aSShri Abhyankar #undef __FUNCT__ 40116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 402bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 403b24902e0SBarry Smith { 404185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 40567877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 406dfbe8321SBarry Smith PetscErrorCode ierr; 407c1490034SHong Zhang PetscInt *row,*col; 40816ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 409397b6df1SKris Buschelman 410397b6df1SKris Buschelman PetscFunctionBegin; 41116ebf90aSShri Abhyankar *v=aa->a; 412bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4132205254eSKarl Rupp nz = aa->nz; 4142205254eSKarl Rupp ai = aa->i; 4152205254eSKarl Rupp aj = aa->j; 41616ebf90aSShri Abhyankar *nnz = nz; 417785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 418185f6596SHong Zhang col = row + nz; 419185f6596SHong Zhang 42016ebf90aSShri Abhyankar nz = 0; 42116ebf90aSShri Abhyankar for (i=0; i<M; i++) { 42216ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 42367877ebaSShri Abhyankar ajj = aj + ai[i]; 42467877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 42567877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 42616ebf90aSShri Abhyankar } 42716ebf90aSShri Abhyankar } 42816ebf90aSShri Abhyankar *r = row; *c = col; 42916ebf90aSShri Abhyankar } 43016ebf90aSShri Abhyankar PetscFunctionReturn(0); 43116ebf90aSShri Abhyankar } 432397b6df1SKris Buschelman 43316ebf90aSShri Abhyankar #undef __FUNCT__ 43467877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 435bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 43667877ebaSShri Abhyankar { 43767877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)A->data; 43833d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 43933d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 44067877ebaSShri Abhyankar PetscErrorCode ierr; 44167877ebaSShri Abhyankar PetscInt *row,*col; 44267877ebaSShri Abhyankar 44367877ebaSShri Abhyankar PetscFunctionBegin; 44433d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 44533d57670SJed Brown M = A->rmap->N/bs; 446cf3759fdSShri Abhyankar *v = aa->a; 447bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 448cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 44967877ebaSShri Abhyankar nz = bs2*aa->nz; 45067877ebaSShri Abhyankar *nnz = nz; 451785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 452185f6596SHong Zhang col = row + nz; 453185f6596SHong Zhang 45467877ebaSShri Abhyankar for (i=0; i<M; i++) { 45567877ebaSShri Abhyankar ajj = aj + ai[i]; 45667877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 45767877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 45867877ebaSShri Abhyankar for (j=0; j<bs; j++) { 45967877ebaSShri Abhyankar for (m=0; m<bs; m++) { 46067877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 461cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 46267877ebaSShri Abhyankar } 46367877ebaSShri Abhyankar } 46467877ebaSShri Abhyankar } 46567877ebaSShri Abhyankar } 466cf3759fdSShri Abhyankar *r = row; *c = col; 46767877ebaSShri Abhyankar } 46867877ebaSShri Abhyankar PetscFunctionReturn(0); 46967877ebaSShri Abhyankar } 47067877ebaSShri Abhyankar 47167877ebaSShri Abhyankar #undef __FUNCT__ 47216ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 473bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 47416ebf90aSShri Abhyankar { 47567877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 47667877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 47716ebf90aSShri Abhyankar PetscErrorCode ierr; 47816ebf90aSShri Abhyankar PetscInt *row,*col; 47916ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 48016ebf90aSShri Abhyankar 48116ebf90aSShri Abhyankar PetscFunctionBegin; 482882afa5aSHong Zhang *v = aa->a; 483bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4842205254eSKarl Rupp nz = aa->nz; 4852205254eSKarl Rupp ai = aa->i; 4862205254eSKarl Rupp aj = aa->j; 4872205254eSKarl Rupp *v = aa->a; 48816ebf90aSShri Abhyankar *nnz = nz; 489785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 490185f6596SHong Zhang col = row + nz; 491185f6596SHong Zhang 49216ebf90aSShri Abhyankar nz = 0; 49316ebf90aSShri Abhyankar for (i=0; i<M; i++) { 49416ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 49567877ebaSShri Abhyankar ajj = aj + ai[i]; 49667877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 49767877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 49816ebf90aSShri Abhyankar } 49916ebf90aSShri Abhyankar } 50016ebf90aSShri Abhyankar *r = row; *c = col; 50116ebf90aSShri Abhyankar } 50216ebf90aSShri Abhyankar PetscFunctionReturn(0); 50316ebf90aSShri Abhyankar } 50416ebf90aSShri Abhyankar 50516ebf90aSShri Abhyankar #undef __FUNCT__ 50616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 507bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 50816ebf90aSShri Abhyankar { 50967877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 51067877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 51167877ebaSShri Abhyankar const PetscScalar *av,*v1; 51216ebf90aSShri Abhyankar PetscScalar *val; 51316ebf90aSShri Abhyankar PetscErrorCode ierr; 51416ebf90aSShri Abhyankar PetscInt *row,*col; 515829b1710SHong Zhang Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 51616ebf90aSShri Abhyankar 51716ebf90aSShri Abhyankar PetscFunctionBegin; 51816ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 51916ebf90aSShri Abhyankar adiag=aa->diag; 520bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 521829b1710SHong Zhang /* count nz in the uppper triangular part of A */ 522829b1710SHong Zhang nz = 0; 523829b1710SHong Zhang for (i=0; i<M; i++) nz += ai[i+1] - adiag[i]; 52416ebf90aSShri Abhyankar *nnz = nz; 525829b1710SHong Zhang 526185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 527185f6596SHong Zhang col = row + nz; 528185f6596SHong Zhang val = (PetscScalar*)(col + nz); 529185f6596SHong Zhang 53016ebf90aSShri Abhyankar nz = 0; 53116ebf90aSShri Abhyankar for (i=0; i<M; i++) { 53216ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 53367877ebaSShri Abhyankar ajj = aj + adiag[i]; 534cf3759fdSShri Abhyankar v1 = av + adiag[i]; 53567877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 53667877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 53716ebf90aSShri Abhyankar } 53816ebf90aSShri Abhyankar } 53916ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 540397b6df1SKris Buschelman } else { 54116ebf90aSShri Abhyankar nz = 0; val = *v; 54216ebf90aSShri Abhyankar for (i=0; i <M; i++) { 54316ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 54467877ebaSShri Abhyankar ajj = aj + adiag[i]; 54567877ebaSShri Abhyankar v1 = av + adiag[i]; 54667877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 54767877ebaSShri Abhyankar val[nz++] = v1[j]; 54816ebf90aSShri Abhyankar } 54916ebf90aSShri Abhyankar } 55016ebf90aSShri Abhyankar } 55116ebf90aSShri Abhyankar PetscFunctionReturn(0); 55216ebf90aSShri Abhyankar } 55316ebf90aSShri Abhyankar 55416ebf90aSShri Abhyankar #undef __FUNCT__ 55516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 556bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 55716ebf90aSShri Abhyankar { 55816ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 55916ebf90aSShri Abhyankar PetscErrorCode ierr; 56016ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 56116ebf90aSShri Abhyankar PetscInt *row,*col; 56216ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 56316ebf90aSShri Abhyankar PetscScalar *val; 564397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 565397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 566397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 56716ebf90aSShri Abhyankar 56816ebf90aSShri Abhyankar PetscFunctionBegin; 569d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 570397b6df1SKris Buschelman av=aa->a; bv=bb->a; 571397b6df1SKris Buschelman 5722205254eSKarl Rupp garray = mat->garray; 5732205254eSKarl Rupp 574bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 57516ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 57616ebf90aSShri Abhyankar *nnz = nz; 577185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 578185f6596SHong Zhang col = row + nz; 579185f6596SHong Zhang val = (PetscScalar*)(col + nz); 580185f6596SHong Zhang 581397b6df1SKris Buschelman *r = row; *c = col; *v = val; 582397b6df1SKris Buschelman } else { 583397b6df1SKris Buschelman row = *r; col = *c; val = *v; 584397b6df1SKris Buschelman } 585397b6df1SKris Buschelman 586028e57e8SHong Zhang jj = 0; irow = rstart; 587397b6df1SKris Buschelman for (i=0; i<m; i++) { 588397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 589397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 590397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 591397b6df1SKris Buschelman bjj = bj + bi[i]; 59216ebf90aSShri Abhyankar v1 = av + ai[i]; 59316ebf90aSShri Abhyankar v2 = bv + bi[i]; 594397b6df1SKris Buschelman 595397b6df1SKris Buschelman /* A-part */ 596397b6df1SKris Buschelman for (j=0; j<countA; j++) { 597bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 598397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 599397b6df1SKris Buschelman } 60016ebf90aSShri Abhyankar val[jj++] = v1[j]; 601397b6df1SKris Buschelman } 60216ebf90aSShri Abhyankar 60316ebf90aSShri Abhyankar /* B-part */ 60416ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 605bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 606397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 607397b6df1SKris Buschelman } 60816ebf90aSShri Abhyankar val[jj++] = v2[j]; 60916ebf90aSShri Abhyankar } 61016ebf90aSShri Abhyankar irow++; 61116ebf90aSShri Abhyankar } 61216ebf90aSShri Abhyankar PetscFunctionReturn(0); 61316ebf90aSShri Abhyankar } 61416ebf90aSShri Abhyankar 61516ebf90aSShri Abhyankar #undef __FUNCT__ 61616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 617bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 61816ebf90aSShri Abhyankar { 61916ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 62016ebf90aSShri Abhyankar PetscErrorCode ierr; 62116ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 62216ebf90aSShri Abhyankar PetscInt *row,*col; 62316ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 62416ebf90aSShri Abhyankar PetscScalar *val; 62516ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 62616ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 62716ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 62816ebf90aSShri Abhyankar 62916ebf90aSShri Abhyankar PetscFunctionBegin; 63016ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 63116ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 63216ebf90aSShri Abhyankar 6332205254eSKarl Rupp garray = mat->garray; 6342205254eSKarl Rupp 635bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 63616ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 63716ebf90aSShri Abhyankar *nnz = nz; 638185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 639185f6596SHong Zhang col = row + nz; 640185f6596SHong Zhang val = (PetscScalar*)(col + nz); 641185f6596SHong Zhang 64216ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 64316ebf90aSShri Abhyankar } else { 64416ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 64516ebf90aSShri Abhyankar } 64616ebf90aSShri Abhyankar 64716ebf90aSShri Abhyankar jj = 0; irow = rstart; 64816ebf90aSShri Abhyankar for (i=0; i<m; i++) { 64916ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 65016ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 65116ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 65216ebf90aSShri Abhyankar bjj = bj + bi[i]; 65316ebf90aSShri Abhyankar v1 = av + ai[i]; 65416ebf90aSShri Abhyankar v2 = bv + bi[i]; 65516ebf90aSShri Abhyankar 65616ebf90aSShri Abhyankar /* A-part */ 65716ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 658bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 65916ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 66016ebf90aSShri Abhyankar } 66116ebf90aSShri Abhyankar val[jj++] = v1[j]; 66216ebf90aSShri Abhyankar } 66316ebf90aSShri Abhyankar 66416ebf90aSShri Abhyankar /* B-part */ 66516ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 666bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 66716ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 66816ebf90aSShri Abhyankar } 66916ebf90aSShri Abhyankar val[jj++] = v2[j]; 67016ebf90aSShri Abhyankar } 67116ebf90aSShri Abhyankar irow++; 67216ebf90aSShri Abhyankar } 67316ebf90aSShri Abhyankar PetscFunctionReturn(0); 67416ebf90aSShri Abhyankar } 67516ebf90aSShri Abhyankar 67616ebf90aSShri Abhyankar #undef __FUNCT__ 67767877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij" 678bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 67967877ebaSShri Abhyankar { 68067877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 68167877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 68267877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 68367877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 684d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 68533d57670SJed Brown const PetscInt bs2=mat->bs2; 68667877ebaSShri Abhyankar PetscErrorCode ierr; 68733d57670SJed Brown PetscInt bs,nz,i,j,k,n,jj,irow,countA,countB,idx; 68867877ebaSShri Abhyankar PetscInt *row,*col; 68967877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 69067877ebaSShri Abhyankar PetscScalar *val; 69167877ebaSShri Abhyankar 69267877ebaSShri Abhyankar PetscFunctionBegin; 69333d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 694bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 69567877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 69667877ebaSShri Abhyankar *nnz = nz; 697185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 698185f6596SHong Zhang col = row + nz; 699185f6596SHong Zhang val = (PetscScalar*)(col + nz); 700185f6596SHong Zhang 70167877ebaSShri Abhyankar *r = row; *c = col; *v = val; 70267877ebaSShri Abhyankar } else { 70367877ebaSShri Abhyankar row = *r; col = *c; val = *v; 70467877ebaSShri Abhyankar } 70567877ebaSShri Abhyankar 706d985c460SShri Abhyankar jj = 0; irow = rstart; 70767877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 70867877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 70967877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 71067877ebaSShri Abhyankar ajj = aj + ai[i]; 71167877ebaSShri Abhyankar bjj = bj + bi[i]; 71267877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 71367877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 71467877ebaSShri Abhyankar 71567877ebaSShri Abhyankar idx = 0; 71667877ebaSShri Abhyankar /* A-part */ 71767877ebaSShri Abhyankar for (k=0; k<countA; k++) { 71867877ebaSShri Abhyankar for (j=0; j<bs; j++) { 71967877ebaSShri Abhyankar for (n=0; n<bs; n++) { 720bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 721d985c460SShri Abhyankar row[jj] = irow + n + shift; 722d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 72367877ebaSShri Abhyankar } 72467877ebaSShri Abhyankar val[jj++] = v1[idx++]; 72567877ebaSShri Abhyankar } 72667877ebaSShri Abhyankar } 72767877ebaSShri Abhyankar } 72867877ebaSShri Abhyankar 72967877ebaSShri Abhyankar idx = 0; 73067877ebaSShri Abhyankar /* B-part */ 73167877ebaSShri Abhyankar for (k=0; k<countB; k++) { 73267877ebaSShri Abhyankar for (j=0; j<bs; j++) { 73367877ebaSShri Abhyankar for (n=0; n<bs; n++) { 734bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 735d985c460SShri Abhyankar row[jj] = irow + n + shift; 736d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 73767877ebaSShri Abhyankar } 738d985c460SShri Abhyankar val[jj++] = v2[idx++]; 73967877ebaSShri Abhyankar } 74067877ebaSShri Abhyankar } 74167877ebaSShri Abhyankar } 742d985c460SShri Abhyankar irow += bs; 74367877ebaSShri Abhyankar } 74467877ebaSShri Abhyankar PetscFunctionReturn(0); 74567877ebaSShri Abhyankar } 74667877ebaSShri Abhyankar 74767877ebaSShri Abhyankar #undef __FUNCT__ 74816ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 749bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 75016ebf90aSShri Abhyankar { 75116ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 75216ebf90aSShri Abhyankar PetscErrorCode ierr; 753e0bace9bSHong Zhang PetscInt rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 75416ebf90aSShri Abhyankar PetscInt *row,*col; 75516ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 75616ebf90aSShri Abhyankar PetscScalar *val; 75716ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 75816ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 75916ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 76016ebf90aSShri Abhyankar 76116ebf90aSShri Abhyankar PetscFunctionBegin; 76216ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 76316ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 76416ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 7652205254eSKarl Rupp 76616ebf90aSShri Abhyankar rstart = A->rmap->rstart; 76716ebf90aSShri Abhyankar 768bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 769e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 770e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 77116ebf90aSShri Abhyankar for (i=0; i<m; i++) { 772e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 77316ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 77416ebf90aSShri Abhyankar bjj = bj + bi[i]; 775e0bace9bSHong Zhang for (j=0; j<countB; j++) { 776e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 777e0bace9bSHong Zhang } 778e0bace9bSHong Zhang } 77916ebf90aSShri Abhyankar 780e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 78116ebf90aSShri Abhyankar *nnz = nz; 782185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 783185f6596SHong Zhang col = row + nz; 784185f6596SHong Zhang val = (PetscScalar*)(col + nz); 785185f6596SHong Zhang 78616ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 78716ebf90aSShri Abhyankar } else { 78816ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 78916ebf90aSShri Abhyankar } 79016ebf90aSShri Abhyankar 79116ebf90aSShri Abhyankar jj = 0; irow = rstart; 79216ebf90aSShri Abhyankar for (i=0; i<m; i++) { 79316ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 79416ebf90aSShri Abhyankar v1 = av + adiag[i]; 79516ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 79616ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 79716ebf90aSShri Abhyankar bjj = bj + bi[i]; 79816ebf90aSShri Abhyankar v2 = bv + bi[i]; 79916ebf90aSShri Abhyankar 80016ebf90aSShri Abhyankar /* A-part */ 80116ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 802bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 80316ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 80416ebf90aSShri Abhyankar } 80516ebf90aSShri Abhyankar val[jj++] = v1[j]; 80616ebf90aSShri Abhyankar } 80716ebf90aSShri Abhyankar 80816ebf90aSShri Abhyankar /* B-part */ 80916ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 81016ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 811bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 81216ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 81316ebf90aSShri Abhyankar } 81416ebf90aSShri Abhyankar val[jj++] = v2[j]; 81516ebf90aSShri Abhyankar } 816397b6df1SKris Buschelman } 817397b6df1SKris Buschelman irow++; 818397b6df1SKris Buschelman } 819397b6df1SKris Buschelman PetscFunctionReturn(0); 820397b6df1SKris Buschelman } 821397b6df1SKris Buschelman 822397b6df1SKris Buschelman #undef __FUNCT__ 82320be8e61SHong Zhang #define __FUNCT__ "MatGetDiagonal_MUMPS" 82420be8e61SHong Zhang PetscErrorCode MatGetDiagonal_MUMPS(Mat A,Vec v) 82520be8e61SHong Zhang { 82620be8e61SHong Zhang PetscFunctionBegin; 82720be8e61SHong Zhang SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Mat type: MUMPS factor"); 82820be8e61SHong Zhang PetscFunctionReturn(0); 82920be8e61SHong Zhang } 83020be8e61SHong Zhang 83120be8e61SHong Zhang #undef __FUNCT__ 8323924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 833dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A) 834dfbe8321SBarry Smith { 835a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 836dfbe8321SBarry Smith PetscErrorCode ierr; 837b24902e0SBarry Smith 838397b6df1SKris Buschelman PetscFunctionBegin; 839a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 840a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 841a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 842801fbe65SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 843a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 844a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 845a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 846b34f08ffSHong Zhang ierr = PetscFree(mumps->info);CHKERRQ(ierr); 84759ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 848a5e57a09SHong Zhang mumps->id.job = JOB_END; 849a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 850*6f3cc6f9SBarry Smith ierr = MPI_Comm_free(&mumps->comm_mumps);CHKERRQ(ierr); 851a5e57a09SHong Zhang if (mumps->Destroy) { 852a5e57a09SHong Zhang ierr = (mumps->Destroy)(A);CHKERRQ(ierr); 853bf0cc555SLisandro Dalcin } 854bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 855bf0cc555SLisandro Dalcin 85697969023SHong Zhang /* clear composed functions */ 857bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 858bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 859bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetIcntl_C",NULL);CHKERRQ(ierr); 860bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 861bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetCntl_C",NULL);CHKERRQ(ierr); 862bc6112feSHong Zhang 863ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfo_C",NULL);CHKERRQ(ierr); 864ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfog_C",NULL);CHKERRQ(ierr); 865ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfo_C",NULL);CHKERRQ(ierr); 866ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfog_C",NULL);CHKERRQ(ierr); 8676444a565SStefano Zampini 8686444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetSchurIndices_C",NULL);CHKERRQ(ierr); 86959ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsInvertSchurComplement_C",NULL);CHKERRQ(ierr); 87059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsCreateSchurComplement_C",NULL);CHKERRQ(ierr); 8716444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetSchurComplement_C",NULL);CHKERRQ(ierr); 87259ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsRestoreSchurComplement_C",NULL);CHKERRQ(ierr); 873e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSolveSchurComplement_C",NULL);CHKERRQ(ierr); 8747404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSolveSchurComplementTranspose_C",NULL);CHKERRQ(ierr); 875397b6df1SKris Buschelman PetscFunctionReturn(0); 876397b6df1SKris Buschelman } 877397b6df1SKris Buschelman 878397b6df1SKris Buschelman #undef __FUNCT__ 879f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 880b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 881b24902e0SBarry Smith { 882a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 883d54de34fSKris Buschelman PetscScalar *array; 88467877ebaSShri Abhyankar Vec b_seq; 885329ec9b3SHong Zhang IS is_iden,is_petsc; 886dfbe8321SBarry Smith PetscErrorCode ierr; 887329ec9b3SHong Zhang PetscInt i; 888883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 889397b6df1SKris Buschelman 890397b6df1SKris Buschelman PetscFunctionBegin; 891883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 892883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 893a5e57a09SHong Zhang mumps->id.nrhs = 1; 894a5e57a09SHong Zhang b_seq = mumps->b_seq; 895a5e57a09SHong Zhang if (mumps->size > 1) { 896329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */ 897a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 898a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 899a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 900397b6df1SKris Buschelman } else { /* size == 1 */ 901397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 902397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 903397b6df1SKris Buschelman } 904a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 905a5e57a09SHong Zhang mumps->id.nrhs = 1; 906940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 907397b6df1SKris Buschelman } 908397b6df1SKris Buschelman 909b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 910b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 911b5fa320bSStefano Zampini 912397b6df1SKris Buschelman /* solve phase */ 913329ec9b3SHong Zhang /*-------------*/ 914a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 915a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 916a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 917397b6df1SKris Buschelman 918b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 919b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 920b5fa320bSStefano Zampini 921a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 922a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 923a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 924a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 925397b6df1SKris Buschelman } 926a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 927a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 928a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 929a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 930a5e57a09SHong Zhang } 931a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 932a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 9336bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9346bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 9352205254eSKarl Rupp 936a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 937397b6df1SKris Buschelman } 938a5e57a09SHong Zhang 939a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 940a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 941329ec9b3SHong Zhang } 942397b6df1SKris Buschelman PetscFunctionReturn(0); 943397b6df1SKris Buschelman } 944397b6df1SKris Buschelman 94551d5961aSHong Zhang #undef __FUNCT__ 94651d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 94751d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 94851d5961aSHong Zhang { 949a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 95051d5961aSHong Zhang PetscErrorCode ierr; 95151d5961aSHong Zhang 95251d5961aSHong Zhang PetscFunctionBegin; 953a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 9540ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 955a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 95651d5961aSHong Zhang PetscFunctionReturn(0); 95751d5961aSHong Zhang } 95851d5961aSHong Zhang 959e0b74bf9SHong Zhang #undef __FUNCT__ 960e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 961e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 962e0b74bf9SHong Zhang { 963bda8bf91SBarry Smith PetscErrorCode ierr; 964bda8bf91SBarry Smith PetscBool flg; 9654e34a73bSHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 966334c5f61SHong Zhang PetscInt i,nrhs,M; 9672cd7d884SHong Zhang PetscScalar *array,*bray; 968bda8bf91SBarry Smith 969e0b74bf9SHong Zhang PetscFunctionBegin; 9700298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 971801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 9720298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 973801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 974801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 9754e34a73bSHong Zhang 9762cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 977334c5f61SHong Zhang mumps->id.nrhs = nrhs; 978334c5f61SHong Zhang mumps->id.lrhs = M; 9794e34a73bSHong Zhang 9802cd7d884SHong Zhang if (mumps->size == 1) { 9812cd7d884SHong Zhang /* copy B to X */ 9822cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 9832cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 9846444a565SStefano Zampini ierr = PetscMemcpy(array,bray,M*nrhs*sizeof(PetscScalar));CHKERRQ(ierr); 9852cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 986940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 987b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 988b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 989801fbe65SHong Zhang 9902cd7d884SHong Zhang /* solve phase */ 9912cd7d884SHong Zhang /*-------------*/ 9922cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 9932cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 9942cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 995b5fa320bSStefano Zampini 996b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 997b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 9982cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 999334c5f61SHong Zhang } else { /*--------- parallel case --------*/ 100071aed81dSHong Zhang PetscInt lsol_loc,nlsol_loc,*isol_loc,*idx,*iidx,*idxx,*isol_loc_save; 10011070efccSSatish Balay MumpsScalar *sol_loc,*sol_loc_save; 1002801fbe65SHong Zhang IS is_to,is_from; 1003334c5f61SHong Zhang PetscInt k,proc,j,m; 1004801fbe65SHong Zhang const PetscInt *rstart; 1005334c5f61SHong Zhang Vec v_mpi,b_seq,x_seq; 1006334c5f61SHong Zhang VecScatter scat_rhs,scat_sol; 1007801fbe65SHong Zhang 1008801fbe65SHong Zhang /* create x_seq to hold local solution */ 100971aed81dSHong Zhang isol_loc_save = mumps->id.isol_loc; /* save it for MatSovle() */ 101071aed81dSHong Zhang sol_loc_save = mumps->id.sol_loc; 1011801fbe65SHong Zhang 101271aed81dSHong Zhang lsol_loc = mumps->id.INFO(23); 101371aed81dSHong Zhang nlsol_loc = nrhs*lsol_loc; /* length of sol_loc */ 101471aed81dSHong Zhang ierr = PetscMalloc2(nlsol_loc,&sol_loc,nlsol_loc,&isol_loc);CHKERRQ(ierr); 1015940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1016801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 1017801fbe65SHong Zhang 10181070efccSSatish Balay ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,nlsol_loc,(PetscScalar*)sol_loc,&x_seq);CHKERRQ(ierr); 10192cd7d884SHong Zhang 102074f0fcc7SHong Zhang /* copy rhs matrix B into vector v_mpi */ 1021334c5f61SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 1022801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 102374f0fcc7SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&v_mpi);CHKERRQ(ierr); 1024801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 1025801fbe65SHong Zhang 1026334c5f61SHong Zhang /* scatter v_mpi to b_seq because MUMPS only supports centralized rhs */ 102774f0fcc7SHong Zhang /* idx: maps from k-th index of v_mpi to (i,j)-th global entry of B; 1028801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 1029801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 1030801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 1031801fbe65SHong Zhang k = 0; 1032801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 1033801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 1034801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 1035801fbe65SHong Zhang iidx[j*M + i] = k; 1036801fbe65SHong Zhang idx[k++] = j*M + i; 1037801fbe65SHong Zhang } 1038801fbe65SHong Zhang } 10392cd7d884SHong Zhang } 10402cd7d884SHong Zhang 1041801fbe65SHong Zhang if (!mumps->myid) { 1042334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&b_seq);CHKERRQ(ierr); 1043801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1044801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 1045801fbe65SHong Zhang } else { 1046334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&b_seq);CHKERRQ(ierr); 1047801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 1048801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 1049801fbe65SHong Zhang } 1050334c5f61SHong Zhang ierr = VecScatterCreate(v_mpi,is_from,b_seq,is_to,&scat_rhs);CHKERRQ(ierr); 1051334c5f61SHong Zhang ierr = VecScatterBegin(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1052801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1053801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1054334c5f61SHong Zhang ierr = VecScatterEnd(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1055801fbe65SHong Zhang 1056801fbe65SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 1057334c5f61SHong Zhang ierr = VecGetArray(b_seq,&bray);CHKERRQ(ierr); 1058940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)bray; 1059334c5f61SHong Zhang ierr = VecRestoreArray(b_seq,&bray);CHKERRQ(ierr); 1060801fbe65SHong Zhang } 1061801fbe65SHong Zhang 1062801fbe65SHong Zhang /* solve phase */ 1063801fbe65SHong Zhang /*-------------*/ 1064801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 1065801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 1066801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 1067801fbe65SHong Zhang 1068334c5f61SHong Zhang /* scatter mumps distributed solution to petsc vector v_mpi, which shares local arrays with solution matrix X */ 106974f0fcc7SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 107074f0fcc7SHong Zhang ierr = VecPlaceArray(v_mpi,array);CHKERRQ(ierr); 1071801fbe65SHong Zhang 1072334c5f61SHong Zhang /* create scatter scat_sol */ 107371aed81dSHong Zhang ierr = PetscMalloc1(nlsol_loc,&idxx);CHKERRQ(ierr); 107471aed81dSHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nlsol_loc,0,1,&is_from);CHKERRQ(ierr); 107571aed81dSHong Zhang for (i=0; i<lsol_loc; i++) { 1076334c5f61SHong Zhang isol_loc[i] -= 1; /* change Fortran style to C style */ 1077334c5f61SHong Zhang idxx[i] = iidx[isol_loc[i]]; 1078801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 1079334c5f61SHong Zhang idxx[j*lsol_loc+i] = iidx[isol_loc[i]+j*M]; 1080801fbe65SHong Zhang } 1081801fbe65SHong Zhang } 108271aed81dSHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nlsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1083334c5f61SHong Zhang ierr = VecScatterCreate(x_seq,is_from,v_mpi,is_to,&scat_sol);CHKERRQ(ierr); 1084334c5f61SHong Zhang ierr = VecScatterBegin(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1085801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1086801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1087334c5f61SHong Zhang ierr = VecScatterEnd(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1088801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 108971aed81dSHong Zhang 109071aed81dSHong Zhang /* free spaces */ 109171aed81dSHong Zhang mumps->id.sol_loc = sol_loc_save; 109271aed81dSHong Zhang mumps->id.isol_loc = isol_loc_save; 109371aed81dSHong Zhang 109471aed81dSHong Zhang ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 1095801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 1096801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 109771aed81dSHong Zhang ierr = VecDestroy(&x_seq);CHKERRQ(ierr); 109874f0fcc7SHong Zhang ierr = VecDestroy(&v_mpi);CHKERRQ(ierr); 1099334c5f61SHong Zhang ierr = VecDestroy(&b_seq);CHKERRQ(ierr); 1100334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_rhs);CHKERRQ(ierr); 1101334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_sol);CHKERRQ(ierr); 1102801fbe65SHong Zhang } 1103e0b74bf9SHong Zhang PetscFunctionReturn(0); 1104e0b74bf9SHong Zhang } 1105e0b74bf9SHong Zhang 1106ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 1107a58c3f20SHong Zhang /* 1108a58c3f20SHong Zhang input: 1109a58c3f20SHong Zhang F: numeric factor 1110a58c3f20SHong Zhang output: 1111a58c3f20SHong Zhang nneg: total number of negative pivots 1112a58c3f20SHong Zhang nzero: 0 1113a58c3f20SHong Zhang npos: (global dimension of F) - nneg 1114a58c3f20SHong Zhang */ 1115a58c3f20SHong Zhang 1116a58c3f20SHong Zhang #undef __FUNCT__ 1117a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 1118dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 1119a58c3f20SHong Zhang { 1120a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1121dfbe8321SBarry Smith PetscErrorCode ierr; 1122c1490034SHong Zhang PetscMPIInt size; 1123a58c3f20SHong Zhang 1124a58c3f20SHong Zhang PetscFunctionBegin; 1125ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 1126bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 1127a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 1128ed85ac9fSHong Zhang 1129710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 1130ed85ac9fSHong Zhang if (nzero || npos) { 1131ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 1132710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 1133710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 1134a58c3f20SHong Zhang } 1135a58c3f20SHong Zhang PetscFunctionReturn(0); 1136a58c3f20SHong Zhang } 1137ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 1138a58c3f20SHong Zhang 1139397b6df1SKris Buschelman #undef __FUNCT__ 1140f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 11410481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 1142af281ebdSHong Zhang { 1143a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 11446849ba73SBarry Smith PetscErrorCode ierr; 1145e09efc27SHong Zhang Mat F_diag; 1146ace3abfcSBarry Smith PetscBool isMPIAIJ; 1147397b6df1SKris Buschelman 1148397b6df1SKris Buschelman PetscFunctionBegin; 1149a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1150397b6df1SKris Buschelman 1151397b6df1SKris Buschelman /* numerical factorization phase */ 1152329ec9b3SHong Zhang /*-------------------------------*/ 1153a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 11544e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 1155a5e57a09SHong Zhang if (!mumps->myid) { 1156940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 1157397b6df1SKris Buschelman } 1158397b6df1SKris Buschelman } else { 1159940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 1160397b6df1SKris Buschelman } 1161a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1162a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 1163151787a6SHong Zhang if (mumps->id.INFO(1) == -13) { 1164151787a6SHong Zhang if (mumps->id.INFO(2) < 0) { 1165151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",-mumps->id.INFO(2)); 1166151787a6SHong Zhang } else { 1167151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d bytes\n",mumps->id.INFO(2)); 1168151787a6SHong Zhang } 1169151787a6SHong Zhang } else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 1170397b6df1SKris Buschelman } 1171a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 1172397b6df1SKris Buschelman 1173dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 1174a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 1175b5fa320bSStefano Zampini mumps->schur_factored = PETSC_FALSE; 117659ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 117767877ebaSShri Abhyankar 1178066565c5SStefano Zampini /* just to be sure that ICNTL(19) value returned by a call from MatMumpsGetIcntl is always consistent */ 1179066565c5SStefano Zampini if (!mumps->sym && mumps->id.ICNTL(19) && mumps->id.ICNTL(19) != 1) mumps->id.ICNTL(19) = 3; 1180066565c5SStefano Zampini 1181a5e57a09SHong Zhang if (mumps->size > 1) { 118267877ebaSShri Abhyankar PetscInt lsol_loc; 118367877ebaSShri Abhyankar PetscScalar *sol_loc; 11842205254eSKarl Rupp 1185c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 1186c2093ab7SHong Zhang if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 1187c2093ab7SHong Zhang else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 1188c2093ab7SHong Zhang F_diag->assembled = PETSC_TRUE; 1189c2093ab7SHong Zhang 1190c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 1191c2093ab7SHong Zhang if (mumps->x_seq) { 1192c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 1193c2093ab7SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 1194c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 1195c2093ab7SHong Zhang } 1196a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 1197dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 1198a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 1199940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1200a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 120167877ebaSShri Abhyankar } 1202397b6df1SKris Buschelman PetscFunctionReturn(0); 1203397b6df1SKris Buschelman } 1204397b6df1SKris Buschelman 12059a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 1206dcd589f8SShri Abhyankar #undef __FUNCT__ 12079a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 12089a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 1209dcd589f8SShri Abhyankar { 12109a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1211dcd589f8SShri Abhyankar PetscErrorCode ierr; 1212b34f08ffSHong Zhang PetscInt icntl,info[40],i,ninfo=40; 1213ace3abfcSBarry Smith PetscBool flg; 1214dcd589f8SShri Abhyankar 1215dcd589f8SShri Abhyankar PetscFunctionBegin; 1216ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 12179a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 12189a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 12199a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 12209a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 12219a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 12229a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 1223dcd589f8SShri Abhyankar 12249a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 12259a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 12269a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 12279a2535b5SHong Zhang 1228d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 12299a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 12309a2535b5SHong Zhang 1231d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 1232dcd589f8SShri Abhyankar if (flg) { 12332205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 12342205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 1235dcd589f8SShri Abhyankar } 1236e0b74bf9SHong Zhang 12370298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 1238d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 12390298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 1240d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 1241d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 1242d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 1243d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 1244d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 124559ac8732SStefano Zampini if (mumps->id.ICNTL(19) <= 0 || mumps->id.ICNTL(19) > 3) { /* reset any schur data (if any) */ 124659ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 124759ac8732SStefano Zampini } 12484e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 1249d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 12509a2535b5SHong Zhang 1251d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 12520298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 12530298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 12549a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 12559a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 1256d7ebd59bSHong Zhang } 1257d7ebd59bSHong Zhang 1258d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 1259d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 12602cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 12610298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 1262d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 12630298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 1264d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 12654e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 12660298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1267dcd589f8SShri Abhyankar 12680298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 12690298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 12700298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 12710298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 12720298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1273e5bb22a1SHong Zhang 12740298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1275b34f08ffSHong Zhang 127616d797efSHong Zhang ierr = PetscOptionsIntArray("-mat_mumps_view_info","request INFO local to each processor","",info,&ninfo,NULL);CHKERRQ(ierr); 1277b34f08ffSHong Zhang if (ninfo) { 1278b34f08ffSHong Zhang if (ninfo > 40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"number of INFO %d must <= 40\n",ninfo); 1279b34f08ffSHong Zhang ierr = PetscMalloc1(ninfo,&mumps->info);CHKERRQ(ierr); 1280b34f08ffSHong Zhang mumps->ninfo = ninfo; 1281b34f08ffSHong Zhang for (i=0; i<ninfo; i++) { 1282b34f08ffSHong Zhang if (info[i] < 0 || info[i]>40) { 1283b34f08ffSHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"index of INFO %d must between 1 and 40\n",ninfo); 1284b34f08ffSHong Zhang } else { 1285b34f08ffSHong Zhang mumps->info[i] = info[i]; 1286b34f08ffSHong Zhang } 1287b34f08ffSHong Zhang } 1288b34f08ffSHong Zhang } 1289b34f08ffSHong Zhang 1290dcd589f8SShri Abhyankar PetscOptionsEnd(); 1291dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1292dcd589f8SShri Abhyankar } 1293dcd589f8SShri Abhyankar 1294dcd589f8SShri Abhyankar #undef __FUNCT__ 1295dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1296f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1297dcd589f8SShri Abhyankar { 1298dcd589f8SShri Abhyankar PetscErrorCode ierr; 1299dcd589f8SShri Abhyankar 1300dcd589f8SShri Abhyankar PetscFunctionBegin; 1301ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1302ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1303ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 13042205254eSKarl Rupp 1305f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1306f697e70eSHong Zhang 1307f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1308f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1309f697e70eSHong Zhang mumps->id.sym = mumps->sym; 13102907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1311f697e70eSHong Zhang 13120298fd71SBarry Smith mumps->scat_rhs = NULL; 13130298fd71SBarry Smith mumps->scat_sol = NULL; 13149a2535b5SHong Zhang 131570544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 13169a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 13179a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 13189a2535b5SHong Zhang if (mumps->size == 1) { 13199a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 13209a2535b5SHong Zhang } else { 13219a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 13224e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 132370544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 13249a2535b5SHong Zhang } 13256444a565SStefano Zampini 13266444a565SStefano Zampini /* schur */ 13276444a565SStefano Zampini mumps->id.size_schur = 0; 13286444a565SStefano Zampini mumps->id.listvar_schur = NULL; 13296444a565SStefano Zampini mumps->id.schur = NULL; 1330b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 1331b5fa320bSStefano Zampini mumps->sizeredrhs = 0; 1332b5fa320bSStefano Zampini mumps->schur_pivots = NULL; 1333b5fa320bSStefano Zampini mumps->schur_work = NULL; 133459ac8732SStefano Zampini mumps->schur_sol = NULL; 133559ac8732SStefano Zampini mumps->schur_sizesol = 0; 133659ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 133759ac8732SStefano Zampini mumps->schur_factored = PETSC_FALSE; 133859ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 1339dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1340dcd589f8SShri Abhyankar } 1341dcd589f8SShri Abhyankar 1342a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1343397b6df1SKris Buschelman #undef __FUNCT__ 1344f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 13450481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1346b24902e0SBarry Smith { 1347a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1348dcd589f8SShri Abhyankar PetscErrorCode ierr; 134967877ebaSShri Abhyankar Vec b; 135067877ebaSShri Abhyankar IS is_iden; 135167877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1352397b6df1SKris Buschelman 1353397b6df1SKris Buschelman PetscFunctionBegin; 1354a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1355dcd589f8SShri Abhyankar 13569a2535b5SHong Zhang /* Set MUMPS options from the options database */ 13579a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1358dcd589f8SShri Abhyankar 1359a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1360dcd589f8SShri Abhyankar 136167877ebaSShri Abhyankar /* analysis phase */ 136267877ebaSShri Abhyankar /*----------------*/ 1363a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1364a5e57a09SHong Zhang mumps->id.n = M; 1365a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 136667877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1367a5e57a09SHong Zhang if (!mumps->myid) { 1368a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1369a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1370940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 137167877ebaSShri Abhyankar } 1372a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 13735248a706SHong Zhang /* 13745248a706SHong Zhang PetscBool flag; 13755248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 13765248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 13775248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 13785248a706SHong Zhang */ 1379a5e57a09SHong Zhang if (!mumps->myid) { 1380e0b74bf9SHong Zhang const PetscInt *idx; 1381e0b74bf9SHong Zhang PetscInt i,*perm_in; 13822205254eSKarl Rupp 1383785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1384e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 13852205254eSKarl Rupp 1386a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1387e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */ 1388e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1389e0b74bf9SHong Zhang } 1390e0b74bf9SHong Zhang } 139167877ebaSShri Abhyankar } 139267877ebaSShri Abhyankar break; 139367877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1394a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1395a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1396a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1397940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 139867877ebaSShri Abhyankar } 139967877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1400a5e57a09SHong Zhang if (!mumps->myid) { 14012cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 14022cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 140367877ebaSShri Abhyankar } else { 1404a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 140567877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 140667877ebaSShri Abhyankar } 14072a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1408a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14096bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14106bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 141167877ebaSShri Abhyankar break; 141267877ebaSShri Abhyankar } 1413a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1414a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 141567877ebaSShri Abhyankar 1416719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1417dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 141851d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 14194e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1420b24902e0SBarry Smith PetscFunctionReturn(0); 1421b24902e0SBarry Smith } 1422b24902e0SBarry Smith 1423450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1424450b117fSShri Abhyankar #undef __FUNCT__ 1425450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 1426450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1427450b117fSShri Abhyankar { 1428a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1429dcd589f8SShri Abhyankar PetscErrorCode ierr; 143067877ebaSShri Abhyankar Vec b; 143167877ebaSShri Abhyankar IS is_iden; 143267877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1433450b117fSShri Abhyankar 1434450b117fSShri Abhyankar PetscFunctionBegin; 1435a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1436dcd589f8SShri Abhyankar 14379a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14389a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1439dcd589f8SShri Abhyankar 1440a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 144167877ebaSShri Abhyankar 144267877ebaSShri Abhyankar /* analysis phase */ 144367877ebaSShri Abhyankar /*----------------*/ 1444a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1445a5e57a09SHong Zhang mumps->id.n = M; 1446a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 144767877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1448a5e57a09SHong Zhang if (!mumps->myid) { 1449a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1450a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1451940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 145267877ebaSShri Abhyankar } 145367877ebaSShri Abhyankar } 145467877ebaSShri Abhyankar break; 145567877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1456a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1457a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1458a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1459940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 146067877ebaSShri Abhyankar } 146167877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1462a5e57a09SHong Zhang if (!mumps->myid) { 1463a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 146467877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 146567877ebaSShri Abhyankar } else { 1466a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 146767877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 146867877ebaSShri Abhyankar } 14692a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1470a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14716bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14726bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 147367877ebaSShri Abhyankar break; 147467877ebaSShri Abhyankar } 1475a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1476a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 147767877ebaSShri Abhyankar 1478450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1479dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 148051d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1481450b117fSShri Abhyankar PetscFunctionReturn(0); 1482450b117fSShri Abhyankar } 1483b24902e0SBarry Smith 1484141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1485397b6df1SKris Buschelman #undef __FUNCT__ 148667877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 148767877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1488b24902e0SBarry Smith { 1489a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1490dcd589f8SShri Abhyankar PetscErrorCode ierr; 149167877ebaSShri Abhyankar Vec b; 149267877ebaSShri Abhyankar IS is_iden; 149367877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1494397b6df1SKris Buschelman 1495397b6df1SKris Buschelman PetscFunctionBegin; 1496a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1497dcd589f8SShri Abhyankar 14989a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14999a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1500dcd589f8SShri Abhyankar 1501a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1502dcd589f8SShri Abhyankar 150367877ebaSShri Abhyankar /* analysis phase */ 150467877ebaSShri Abhyankar /*----------------*/ 1505a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1506a5e57a09SHong Zhang mumps->id.n = M; 1507a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 150867877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1509a5e57a09SHong Zhang if (!mumps->myid) { 1510a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1511a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1512940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 151367877ebaSShri Abhyankar } 151467877ebaSShri Abhyankar } 151567877ebaSShri Abhyankar break; 151667877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1517a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1518a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1519a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1520940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 152167877ebaSShri Abhyankar } 152267877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1523a5e57a09SHong Zhang if (!mumps->myid) { 1524a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 152567877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 152667877ebaSShri Abhyankar } else { 1527a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 152867877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 152967877ebaSShri Abhyankar } 15302a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1531a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 15326bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 15336bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 153467877ebaSShri Abhyankar break; 153567877ebaSShri Abhyankar } 1536a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1537a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 153867877ebaSShri Abhyankar 15392792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1540dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 154151d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 15424e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 15434e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 15440298fd71SBarry Smith F->ops->getinertia = NULL; 15454e34a73bSHong Zhang #else 15464e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1547db4efbfdSBarry Smith #endif 1548b24902e0SBarry Smith PetscFunctionReturn(0); 1549b24902e0SBarry Smith } 1550b24902e0SBarry Smith 1551397b6df1SKris Buschelman #undef __FUNCT__ 155264e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 155364e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 155474ed9c26SBarry Smith { 1555f6c57405SHong Zhang PetscErrorCode ierr; 155664e6c443SBarry Smith PetscBool iascii; 155764e6c443SBarry Smith PetscViewerFormat format; 1558a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1559f6c57405SHong Zhang 1560f6c57405SHong Zhang PetscFunctionBegin; 156164e6c443SBarry Smith /* check if matrix is mumps type */ 156264e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 156364e6c443SBarry Smith 1564251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 156564e6c443SBarry Smith if (iascii) { 156664e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 156764e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 156864e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1569a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1570a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1571a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1572a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1573a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1574a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1575a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1576a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1577a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1578a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1579a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1580a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1581a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1582a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1583a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1584a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1585a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1586a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1587a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1588f6c57405SHong Zhang } 1589a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1590a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1591a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1592f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1593a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1594a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1595a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1596ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (solution struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1597a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1598a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1599c0165424SHong Zhang 1600a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1601a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1602a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1603a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1604a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1605a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr); 160642179a6aSHong Zhang 1607a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1608a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1609a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1610f6c57405SHong Zhang 1611a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1612a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1613ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absolute pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1614ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (value of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1615a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1616f6c57405SHong Zhang 1617f6c57405SHong Zhang /* infomation local to each processor */ 161834ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 16191575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(viewer);CHKERRQ(ierr); 1620a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 162134ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 162234ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1623a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 162434ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 162534ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1626a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 162734ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1628f6c57405SHong Zhang 162934ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1630a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 163134ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1632f6c57405SHong Zhang 163334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1634a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 163534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1636f6c57405SHong Zhang 163734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1638a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 163934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1640b34f08ffSHong Zhang 1641b34f08ffSHong Zhang if (mumps->ninfo && mumps->ninfo <= 40){ 1642b34f08ffSHong Zhang PetscInt i; 1643b34f08ffSHong Zhang for (i=0; i<mumps->ninfo; i++){ 1644b34f08ffSHong Zhang ierr = PetscViewerASCIIPrintf(viewer, " INFO(%d): \n",mumps->info[i]);CHKERRQ(ierr); 1645b34f08ffSHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(mumps->info[i]));CHKERRQ(ierr); 1646b34f08ffSHong Zhang ierr = PetscViewerFlush(viewer); 1647b34f08ffSHong Zhang } 1648b34f08ffSHong Zhang } 1649b34f08ffSHong Zhang 1650b34f08ffSHong Zhang 16511575c14dSBarry Smith ierr = PetscViewerASCIIPopSynchronized(viewer);CHKERRQ(ierr); 1652f6c57405SHong Zhang 1653a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1654a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1655a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1656a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1657a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1658f6c57405SHong Zhang 1659a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1660a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1661a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1662a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1663a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1664a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1665a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1666a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1667a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1668a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1669a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1670a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1671a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1672a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1673a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1674a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1675a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1676a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1677a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1678a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1679a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1680a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1681a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 168240d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 168340d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 168440d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(30, 31) (after solution: size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 168540d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 168640d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 168740d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1688f6c57405SHong Zhang } 1689f6c57405SHong Zhang } 1690cb828f0fSHong Zhang } 1691f6c57405SHong Zhang PetscFunctionReturn(0); 1692f6c57405SHong Zhang } 1693f6c57405SHong Zhang 169435bd34faSBarry Smith #undef __FUNCT__ 169535bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 169635bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 169735bd34faSBarry Smith { 1698cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 169935bd34faSBarry Smith 170035bd34faSBarry Smith PetscFunctionBegin; 170135bd34faSBarry Smith info->block_size = 1.0; 1702cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1703cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 170435bd34faSBarry Smith info->nz_unneeded = 0.0; 170535bd34faSBarry Smith info->assemblies = 0.0; 170635bd34faSBarry Smith info->mallocs = 0.0; 170735bd34faSBarry Smith info->memory = 0.0; 170835bd34faSBarry Smith info->fill_ratio_given = 0; 170935bd34faSBarry Smith info->fill_ratio_needed = 0; 171035bd34faSBarry Smith info->factor_mallocs = 0; 171135bd34faSBarry Smith PetscFunctionReturn(0); 171235bd34faSBarry Smith } 171335bd34faSBarry Smith 17145ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 17155ccb76cbSHong Zhang #undef __FUNCT__ 17166444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices_MUMPS" 17176444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices_MUMPS(Mat F,PetscInt size,PetscInt idxs[]) 17186444a565SStefano Zampini { 17196444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17206444a565SStefano Zampini PetscErrorCode ierr; 17216444a565SStefano Zampini 17226444a565SStefano Zampini PetscFunctionBegin; 172359ac8732SStefano Zampini if (mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MUMPS parallel Schur complements not yet supported from PETSc\n"); 17246444a565SStefano Zampini if (mumps->id.size_schur != size) { 17256444a565SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 17266444a565SStefano Zampini mumps->id.size_schur = size; 17276444a565SStefano Zampini mumps->id.schur_lld = size; 17286444a565SStefano Zampini ierr = PetscMalloc2(size,&mumps->id.listvar_schur,size*size,&mumps->id.schur);CHKERRQ(ierr); 17296444a565SStefano Zampini } 17306444a565SStefano Zampini ierr = PetscMemcpy(mumps->id.listvar_schur,idxs,size*sizeof(PetscInt));CHKERRQ(ierr); 17316444a565SStefano Zampini if (F->factortype == MAT_FACTOR_LU) { 173259ac8732SStefano Zampini mumps->id.ICNTL(19) = 3; /* MUMPS returns full matrix */ 17336444a565SStefano Zampini } else { 173459ac8732SStefano Zampini mumps->id.ICNTL(19) = 2; /* MUMPS returns lower triangular part */ 17356444a565SStefano Zampini } 173659ac8732SStefano Zampini /* set a special value of ICNTL (not handled my MUMPS) to be used in the solve phase by PETSc */ 1737b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 17386444a565SStefano Zampini PetscFunctionReturn(0); 17396444a565SStefano Zampini } 17406444a565SStefano Zampini 17416444a565SStefano Zampini #undef __FUNCT__ 17426444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices" 17436444a565SStefano Zampini /*@ 17446444a565SStefano Zampini MatMumpsSetSchurIndices - Set indices defining the Schur complement that MUMPS will compute during the factorization steps 17456444a565SStefano Zampini 17466444a565SStefano Zampini Logically Collective on Mat 17476444a565SStefano Zampini 17486444a565SStefano Zampini Input Parameters: 17496444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 17506444a565SStefano Zampini . size - size of the Schur complement indices 17516444a565SStefano Zampini - idxs[] - array of Schur complement indices 17526444a565SStefano Zampini 17536444a565SStefano Zampini Notes: 175459ac8732SStefano Zampini The user has to free the array idxs[] since the indices are copied by the routine. 175559ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 17566444a565SStefano Zampini 17576444a565SStefano Zampini Level: advanced 17586444a565SStefano Zampini 17596444a565SStefano Zampini References: MUMPS Users' Guide 17606444a565SStefano Zampini 176159ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsCreateSchurComplement(), MatMumpsGetSchurComplement() 17626444a565SStefano Zampini @*/ 17636444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices(Mat F,PetscInt size,PetscInt idxs[]) 17646444a565SStefano Zampini { 17656444a565SStefano Zampini PetscErrorCode ierr; 17666444a565SStefano Zampini 17676444a565SStefano Zampini PetscFunctionBegin; 1768e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 1769e807eca7SStefano Zampini if (size) PetscValidIntPointer(idxs,3); 17706444a565SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsSetSchurIndices_C",(Mat,PetscInt,PetscInt[]),(F,size,idxs));CHKERRQ(ierr); 17716444a565SStefano Zampini PetscFunctionReturn(0); 17726444a565SStefano Zampini } 177359ac8732SStefano Zampini 17746444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 17756444a565SStefano Zampini #undef __FUNCT__ 177659ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement_MUMPS" 177759ac8732SStefano Zampini PetscErrorCode MatMumpsCreateSchurComplement_MUMPS(Mat F,Mat* S) 17786444a565SStefano Zampini { 17796444a565SStefano Zampini Mat St; 17806444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17816444a565SStefano Zampini PetscScalar *array; 17826444a565SStefano Zampini #if defined(PETSC_USE_COMPLEX) 17838ac429a0SStefano Zampini PetscScalar im = PetscSqrtScalar((PetscScalar)-1.0); 17846444a565SStefano Zampini #endif 17856444a565SStefano Zampini PetscErrorCode ierr; 17866444a565SStefano Zampini 17876444a565SStefano Zampini PetscFunctionBegin; 1788*6f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 1789*6f3cc6f9SBarry Smith else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 1790*6f3cc6f9SBarry Smith else if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 1791*6f3cc6f9SBarry Smith 17926444a565SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)F),&St);CHKERRQ(ierr); 17936444a565SStefano Zampini ierr = MatSetSizes(St,PETSC_DECIDE,PETSC_DECIDE,mumps->id.size_schur,mumps->id.size_schur);CHKERRQ(ierr); 17946444a565SStefano Zampini ierr = MatSetType(St,MATDENSE);CHKERRQ(ierr); 17956444a565SStefano Zampini ierr = MatSetUp(St);CHKERRQ(ierr); 17966444a565SStefano Zampini ierr = MatDenseGetArray(St,&array);CHKERRQ(ierr); 179759ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full matrix */ 17986444a565SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 17996444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18006444a565SStefano Zampini for (i=0;i<N;i++) { 18016444a565SStefano Zampini for (j=0;j<N;j++) { 18026444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18036444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18046444a565SStefano Zampini #else 18056444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18066444a565SStefano Zampini #endif 18076444a565SStefano Zampini array[j*N+i] = val; 18086444a565SStefano Zampini } 18096444a565SStefano Zampini } 18106444a565SStefano Zampini } else { /* stored by columns */ 18116444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18126444a565SStefano Zampini } 18136444a565SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 18146444a565SStefano Zampini if (mumps->id.ICNTL(19) == 2) { /* lower triangular stored by columns */ 18156444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18166444a565SStefano Zampini for (i=0;i<N;i++) { 18176444a565SStefano Zampini for (j=i;j<N;j++) { 18186444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18196444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18206444a565SStefano Zampini #else 18216444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18226444a565SStefano Zampini #endif 18236444a565SStefano Zampini array[i*N+j] = val; 18246444a565SStefano Zampini array[j*N+i] = val; 18256444a565SStefano Zampini } 18266444a565SStefano Zampini } 18276444a565SStefano Zampini } else if (mumps->id.ICNTL(19) == 3) { /* full matrix */ 18286444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18296444a565SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 18306444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18316444a565SStefano Zampini for (i=0;i<N;i++) { 18326444a565SStefano Zampini for (j=0;j<i+1;j++) { 18336444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18346444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18356444a565SStefano Zampini #else 18366444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18376444a565SStefano Zampini #endif 18386444a565SStefano Zampini array[i*N+j] = val; 18396444a565SStefano Zampini array[j*N+i] = val; 18406444a565SStefano Zampini } 18416444a565SStefano Zampini } 18426444a565SStefano Zampini } 18436444a565SStefano Zampini } 18446444a565SStefano Zampini ierr = MatDenseRestoreArray(St,&array);CHKERRQ(ierr); 18456444a565SStefano Zampini *S = St; 18466444a565SStefano Zampini PetscFunctionReturn(0); 18476444a565SStefano Zampini } 18486444a565SStefano Zampini 18496444a565SStefano Zampini #undef __FUNCT__ 185059ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement" 18516444a565SStefano Zampini /*@ 185259ac8732SStefano Zampini MatMumpsCreateSchurComplement - Create a Schur complement matrix object using Schur data computed by MUMPS during the factorization step 18536444a565SStefano Zampini 18546444a565SStefano Zampini Logically Collective on Mat 18556444a565SStefano Zampini 18566444a565SStefano Zampini Input Parameters: 18576444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 18586444a565SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 18596444a565SStefano Zampini 18606444a565SStefano Zampini Notes: 186159ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 186259ac8732SStefano Zampini The routine provides a copy of the Schur data stored within MUMPS data strutures. The caller must destroy the object when it is no longer needed. 1863066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 18646444a565SStefano Zampini 18656444a565SStefano Zampini Level: advanced 18666444a565SStefano Zampini 18676444a565SStefano Zampini References: MUMPS Users' Guide 18686444a565SStefano Zampini 186959ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement() 187059ac8732SStefano Zampini @*/ 187159ac8732SStefano Zampini PetscErrorCode MatMumpsCreateSchurComplement(Mat F,Mat* S) 187259ac8732SStefano Zampini { 187359ac8732SStefano Zampini PetscErrorCode ierr; 187459ac8732SStefano Zampini 187559ac8732SStefano Zampini PetscFunctionBegin; 1876e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 187759ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsCreateSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 187859ac8732SStefano Zampini PetscFunctionReturn(0); 187959ac8732SStefano Zampini } 188059ac8732SStefano Zampini 188159ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 188259ac8732SStefano Zampini #undef __FUNCT__ 188359ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement_MUMPS" 188459ac8732SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement_MUMPS(Mat F,Mat* S) 188559ac8732SStefano Zampini { 188659ac8732SStefano Zampini Mat St; 188759ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 188859ac8732SStefano Zampini PetscErrorCode ierr; 188959ac8732SStefano Zampini 189059ac8732SStefano Zampini PetscFunctionBegin; 1891*6f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 1892*6f3cc6f9SBarry Smith else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 1893*6f3cc6f9SBarry Smith else if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 1894*6f3cc6f9SBarry Smith 189559ac8732SStefano Zampini /* It should be the responsibility of the user to handle different ICNTL(19) cases if they want to work with the raw data */ 189659ac8732SStefano Zampini /* should I also add errors when the Schur complement has been already factored? */ 189759ac8732SStefano Zampini ierr = MatCreateSeqDense(PetscObjectComm((PetscObject)F),mumps->id.size_schur,mumps->id.size_schur,(PetscScalar*)mumps->id.schur,&St);CHKERRQ(ierr); 189859ac8732SStefano Zampini *S = St; 189959ac8732SStefano Zampini mumps->schur_restored = PETSC_FALSE; 190059ac8732SStefano Zampini PetscFunctionReturn(0); 190159ac8732SStefano Zampini } 190259ac8732SStefano Zampini 190359ac8732SStefano Zampini #undef __FUNCT__ 190459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement" 190559ac8732SStefano Zampini /*@ 190659ac8732SStefano Zampini MatMumpsGetSchurComplement - Get a Schur complement matrix object using the current status of the raw Schur data computed by MUMPS during the factorization step 190759ac8732SStefano Zampini 190859ac8732SStefano Zampini Logically Collective on Mat 190959ac8732SStefano Zampini 191059ac8732SStefano Zampini Input Parameters: 191159ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 191259ac8732SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 191359ac8732SStefano Zampini 191459ac8732SStefano Zampini Notes: 191559ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 191659ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. The caller should call MatMumpsRestoreSchurComplement when the object is no longer needed. 1917066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 191859ac8732SStefano Zampini 191959ac8732SStefano Zampini Level: advanced 192059ac8732SStefano Zampini 192159ac8732SStefano Zampini References: MUMPS Users' Guide 192259ac8732SStefano Zampini 192359ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsRestoreSchurComplement(), MatMumpsCreateSchurComplement() 19246444a565SStefano Zampini @*/ 19256444a565SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement(Mat F,Mat* S) 19266444a565SStefano Zampini { 19276444a565SStefano Zampini PetscErrorCode ierr; 19286444a565SStefano Zampini 19296444a565SStefano Zampini PetscFunctionBegin; 1930e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 193159ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsGetSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 193259ac8732SStefano Zampini PetscFunctionReturn(0); 193359ac8732SStefano Zampini } 193459ac8732SStefano Zampini 193559ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 193659ac8732SStefano Zampini #undef __FUNCT__ 193759ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement_MUMPS" 193859ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement_MUMPS(Mat F,Mat* S) 193959ac8732SStefano Zampini { 194059ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 194159ac8732SStefano Zampini PetscErrorCode ierr; 194259ac8732SStefano Zampini 194359ac8732SStefano Zampini PetscFunctionBegin; 1944*6f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 1945*6f3cc6f9SBarry Smith else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 1946*6f3cc6f9SBarry Smith else if (mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has been already restored"); 194759ac8732SStefano Zampini ierr = MatDestroy(S);CHKERRQ(ierr); 194859ac8732SStefano Zampini *S = NULL; 194959ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 195059ac8732SStefano Zampini PetscFunctionReturn(0); 195159ac8732SStefano Zampini } 195259ac8732SStefano Zampini 195359ac8732SStefano Zampini #undef __FUNCT__ 195459ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement" 195559ac8732SStefano Zampini /*@ 195659ac8732SStefano Zampini MatMumpsRestoreSchurComplement - Restore the Schur complement matrix object obtained from a call to MatGetSchurComplement 195759ac8732SStefano Zampini 195859ac8732SStefano Zampini Logically Collective on Mat 195959ac8732SStefano Zampini 196059ac8732SStefano Zampini Input Parameters: 196159ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 196259ac8732SStefano Zampini . *S - location where the Schur complement is stored 196359ac8732SStefano Zampini 196459ac8732SStefano Zampini Notes: 196559ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 196659ac8732SStefano Zampini 196759ac8732SStefano Zampini Level: advanced 196859ac8732SStefano Zampini 196959ac8732SStefano Zampini References: MUMPS Users' Guide 197059ac8732SStefano Zampini 197159ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement(), MatMumpsCreateSchurComplement() 197259ac8732SStefano Zampini @*/ 197359ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement(Mat F,Mat* S) 197459ac8732SStefano Zampini { 197559ac8732SStefano Zampini PetscErrorCode ierr; 197659ac8732SStefano Zampini 197759ac8732SStefano Zampini PetscFunctionBegin; 1978e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 197959ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsRestoreSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 198059ac8732SStefano Zampini PetscFunctionReturn(0); 198159ac8732SStefano Zampini } 198259ac8732SStefano Zampini 198359ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 198459ac8732SStefano Zampini #undef __FUNCT__ 198559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement_MUMPS" 198659ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement_MUMPS(Mat F) 198759ac8732SStefano Zampini { 198859ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 198959ac8732SStefano Zampini PetscErrorCode ierr; 199059ac8732SStefano Zampini 199159ac8732SStefano Zampini PetscFunctionBegin; 199259ac8732SStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing */ 199359ac8732SStefano Zampini PetscFunctionReturn(0); 199459ac8732SStefano Zampini } 1995*6f3cc6f9SBarry Smith if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 1996*6f3cc6f9SBarry Smith else if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 199759ac8732SStefano Zampini ierr = MatMumpsInvertSchur_Private(mumps);CHKERRQ(ierr); 199859ac8732SStefano Zampini PetscFunctionReturn(0); 199959ac8732SStefano Zampini } 200059ac8732SStefano Zampini 200159ac8732SStefano Zampini #undef __FUNCT__ 200259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement" 200359ac8732SStefano Zampini /*@ 200459ac8732SStefano Zampini MatMumpsInvertSchurComplement - Invert the raw Schur data computed by MUMPS during the factorization step 200559ac8732SStefano Zampini 200659ac8732SStefano Zampini Logically Collective on Mat 200759ac8732SStefano Zampini 200859ac8732SStefano Zampini Input Parameters: 200959ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 201059ac8732SStefano Zampini 201159ac8732SStefano Zampini Notes: 201259ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 201359ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. 201459ac8732SStefano Zampini 201559ac8732SStefano Zampini Level: advanced 201659ac8732SStefano Zampini 201759ac8732SStefano Zampini References: MUMPS Users' Guide 201859ac8732SStefano Zampini 201959ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 202059ac8732SStefano Zampini @*/ 202159ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement(Mat F) 202259ac8732SStefano Zampini { 202359ac8732SStefano Zampini PetscErrorCode ierr; 202459ac8732SStefano Zampini 202559ac8732SStefano Zampini PetscFunctionBegin; 2026e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 202759ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsInvertSchurComplement_C",(Mat),(F));CHKERRQ(ierr); 20286444a565SStefano Zampini PetscFunctionReturn(0); 20296444a565SStefano Zampini } 20306444a565SStefano Zampini 20316444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 20326444a565SStefano Zampini #undef __FUNCT__ 2033e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement_MUMPS" 2034e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement_MUMPS(Mat F, Vec rhs, Vec sol) 2035e807eca7SStefano Zampini { 2036e807eca7SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2037e807eca7SStefano Zampini MumpsScalar *orhs; 2038e807eca7SStefano Zampini PetscScalar *osol,*nrhs,*nsol; 20399a3a5937SStefano Zampini PetscInt orhs_size,osol_size,olrhs_size; 2040e807eca7SStefano Zampini PetscErrorCode ierr; 2041e807eca7SStefano Zampini 2042e807eca7SStefano Zampini PetscFunctionBegin; 2043*6f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 2044*6f3cc6f9SBarry Smith if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 2045*6f3cc6f9SBarry Smith else if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 2046*6f3cc6f9SBarry Smith 2047e807eca7SStefano Zampini /* swap pointers */ 2048e807eca7SStefano Zampini orhs = mumps->id.redrhs; 20499a3a5937SStefano Zampini olrhs_size = mumps->id.lredrhs; 2050a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 2051e807eca7SStefano Zampini osol = mumps->schur_sol; 2052a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 2053e807eca7SStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 2054e807eca7SStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 2055e807eca7SStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2056a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 20579a3a5937SStefano Zampini mumps->id.lredrhs = mumps->sizeredrhs; 2058e807eca7SStefano Zampini mumps->schur_sol = nsol; 2059a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 2060a12f35bfSStefano Zampini 2061e807eca7SStefano Zampini /* solve Schur complement */ 2062e807eca7SStefano Zampini mumps->id.nrhs = 1; 2063e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 2064e807eca7SStefano Zampini /* restore pointers */ 2065e807eca7SStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 2066e807eca7SStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 2067e807eca7SStefano Zampini mumps->id.redrhs = orhs; 20689a3a5937SStefano Zampini mumps->id.lredrhs = olrhs_size; 2069a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 2070e807eca7SStefano Zampini mumps->schur_sol = osol; 2071a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 2072e807eca7SStefano Zampini PetscFunctionReturn(0); 2073e807eca7SStefano Zampini } 2074e807eca7SStefano Zampini 2075e807eca7SStefano Zampini #undef __FUNCT__ 2076e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement" 2077e807eca7SStefano Zampini /*@ 2078e807eca7SStefano Zampini MatMumpsSolveSchurComplement - Solve the Schur complement system computed by MUMPS during the factorization step 2079e807eca7SStefano Zampini 2080e807eca7SStefano Zampini Logically Collective on Mat 2081e807eca7SStefano Zampini 2082e807eca7SStefano Zampini Input Parameters: 2083e807eca7SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2084e807eca7SStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 2085e807eca7SStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 2086e807eca7SStefano Zampini 2087e807eca7SStefano Zampini Notes: 2088e807eca7SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 2089e807eca7SStefano Zampini The sizes of the vectors should match the size of the Schur complement 2090e807eca7SStefano Zampini 2091e807eca7SStefano Zampini Level: advanced 2092e807eca7SStefano Zampini 2093e807eca7SStefano Zampini References: MUMPS Users' Guide 2094e807eca7SStefano Zampini 2095e807eca7SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 2096e807eca7SStefano Zampini @*/ 2097e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement(Mat F, Vec rhs, Vec sol) 2098e807eca7SStefano Zampini { 2099e807eca7SStefano Zampini PetscErrorCode ierr; 2100e807eca7SStefano Zampini 2101e807eca7SStefano Zampini PetscFunctionBegin; 2102e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 2103e807eca7SStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 2104e807eca7SStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 2105e807eca7SStefano Zampini PetscCheckSameComm(F,1,rhs,2); 2106e807eca7SStefano Zampini PetscCheckSameComm(F,1,sol,3); 21077404bcfbSStefano Zampini ierr = PetscUseMethod(F,"MatMumpsSolveSchurComplement_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 21087404bcfbSStefano Zampini PetscFunctionReturn(0); 21097404bcfbSStefano Zampini } 21107404bcfbSStefano Zampini 21117404bcfbSStefano Zampini /* -------------------------------------------------------------------------------------------*/ 21127404bcfbSStefano Zampini #undef __FUNCT__ 21137404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose_MUMPS" 21147404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose_MUMPS(Mat F, Vec rhs, Vec sol) 21157404bcfbSStefano Zampini { 21167404bcfbSStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 21177404bcfbSStefano Zampini MumpsScalar *orhs; 21187404bcfbSStefano Zampini PetscScalar *osol,*nrhs,*nsol; 2119a12f35bfSStefano Zampini PetscInt orhs_size,osol_size; 21207404bcfbSStefano Zampini PetscErrorCode ierr; 21217404bcfbSStefano Zampini 21227404bcfbSStefano Zampini PetscFunctionBegin; 2123*6f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 2124*6f3cc6f9SBarry Smith else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 2125*6f3cc6f9SBarry Smith if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 2126*6f3cc6f9SBarry Smith 21277404bcfbSStefano Zampini /* swap pointers */ 21287404bcfbSStefano Zampini orhs = mumps->id.redrhs; 2129a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 21307404bcfbSStefano Zampini osol = mumps->schur_sol; 2131a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 21327404bcfbSStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 21337404bcfbSStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 21347404bcfbSStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2135a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 21367404bcfbSStefano Zampini mumps->schur_sol = nsol; 2137a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 2138a12f35bfSStefano Zampini 21397404bcfbSStefano Zampini /* solve Schur complement */ 21407404bcfbSStefano Zampini mumps->id.nrhs = 1; 21417404bcfbSStefano Zampini mumps->id.ICNTL(9) = 0; 21427404bcfbSStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 21437404bcfbSStefano Zampini mumps->id.ICNTL(9) = 1; 21447404bcfbSStefano Zampini /* restore pointers */ 21457404bcfbSStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 21467404bcfbSStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 21477404bcfbSStefano Zampini mumps->id.redrhs = orhs; 2148a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 21497404bcfbSStefano Zampini mumps->schur_sol = osol; 2150a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 21517404bcfbSStefano Zampini PetscFunctionReturn(0); 21527404bcfbSStefano Zampini } 21537404bcfbSStefano Zampini 21547404bcfbSStefano Zampini #undef __FUNCT__ 21557404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose" 21567404bcfbSStefano Zampini /*@ 21577404bcfbSStefano Zampini MatMumpsSolveSchurComplementTranspose - Solve the transpose of the Schur complement system computed by MUMPS during the factorization step 21587404bcfbSStefano Zampini 21597404bcfbSStefano Zampini Logically Collective on Mat 21607404bcfbSStefano Zampini 21617404bcfbSStefano Zampini Input Parameters: 21627404bcfbSStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 21637404bcfbSStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 21647404bcfbSStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 21657404bcfbSStefano Zampini 21667404bcfbSStefano Zampini Notes: 21677404bcfbSStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 21687404bcfbSStefano Zampini The sizes of the vectors should match the size of the Schur complement 21697404bcfbSStefano Zampini 21707404bcfbSStefano Zampini Level: advanced 21717404bcfbSStefano Zampini 21727404bcfbSStefano Zampini References: MUMPS Users' Guide 21737404bcfbSStefano Zampini 21747404bcfbSStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 21757404bcfbSStefano Zampini @*/ 21767404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose(Mat F, Vec rhs, Vec sol) 21777404bcfbSStefano Zampini { 21787404bcfbSStefano Zampini PetscErrorCode ierr; 21797404bcfbSStefano Zampini 21807404bcfbSStefano Zampini PetscFunctionBegin; 21817404bcfbSStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 21827404bcfbSStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 21837404bcfbSStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 21847404bcfbSStefano Zampini PetscCheckSameComm(F,1,rhs,2); 21857404bcfbSStefano Zampini PetscCheckSameComm(F,1,sol,3); 21867404bcfbSStefano Zampini ierr = PetscUseMethod(F,"MatMumpsSolveSchurComplementTranspose_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 2187e807eca7SStefano Zampini PetscFunctionReturn(0); 2188e807eca7SStefano Zampini } 2189e807eca7SStefano Zampini 2190e807eca7SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 2191e807eca7SStefano Zampini #undef __FUNCT__ 21925ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 21935ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 21945ccb76cbSHong Zhang { 2195a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 21965ccb76cbSHong Zhang 21975ccb76cbSHong Zhang PetscFunctionBegin; 2198a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 21995ccb76cbSHong Zhang PetscFunctionReturn(0); 22005ccb76cbSHong Zhang } 22015ccb76cbSHong Zhang 22025ccb76cbSHong Zhang #undef __FUNCT__ 2203bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 2204bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 2205bc6112feSHong Zhang { 2206bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2207bc6112feSHong Zhang 2208bc6112feSHong Zhang PetscFunctionBegin; 2209bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 2210bc6112feSHong Zhang PetscFunctionReturn(0); 2211bc6112feSHong Zhang } 2212bc6112feSHong Zhang 2213bc6112feSHong Zhang #undef __FUNCT__ 22145ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 22155ccb76cbSHong Zhang /*@ 22165ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 22175ccb76cbSHong Zhang 22185ccb76cbSHong Zhang Logically Collective on Mat 22195ccb76cbSHong Zhang 22205ccb76cbSHong Zhang Input Parameters: 22215ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 22225ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 22235ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 22245ccb76cbSHong Zhang 22255ccb76cbSHong Zhang Options Database: 22265ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 22275ccb76cbSHong Zhang 22285ccb76cbSHong Zhang Level: beginner 22295ccb76cbSHong Zhang 22305ccb76cbSHong Zhang References: MUMPS Users' Guide 22315ccb76cbSHong Zhang 22325ccb76cbSHong Zhang .seealso: MatGetFactor() 22335ccb76cbSHong Zhang @*/ 22345ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 22355ccb76cbSHong Zhang { 22365ccb76cbSHong Zhang PetscErrorCode ierr; 22375ccb76cbSHong Zhang 22385ccb76cbSHong Zhang PetscFunctionBegin; 22395ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 22405ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 22415ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 22425ccb76cbSHong Zhang PetscFunctionReturn(0); 22435ccb76cbSHong Zhang } 22445ccb76cbSHong Zhang 2245bc6112feSHong Zhang #undef __FUNCT__ 2246bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 2247a21f80fcSHong Zhang /*@ 2248a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS parameter ICNTL() 2249a21f80fcSHong Zhang 2250a21f80fcSHong Zhang Logically Collective on Mat 2251a21f80fcSHong Zhang 2252a21f80fcSHong Zhang Input Parameters: 2253a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2254a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 2255a21f80fcSHong Zhang 2256a21f80fcSHong Zhang Output Parameter: 2257a21f80fcSHong Zhang . ival - value of MUMPS ICNTL(icntl) 2258a21f80fcSHong Zhang 2259a21f80fcSHong Zhang Level: beginner 2260a21f80fcSHong Zhang 2261a21f80fcSHong Zhang References: MUMPS Users' Guide 2262a21f80fcSHong Zhang 2263a21f80fcSHong Zhang .seealso: MatGetFactor() 2264a21f80fcSHong Zhang @*/ 2265bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 2266bc6112feSHong Zhang { 2267bc6112feSHong Zhang PetscErrorCode ierr; 2268bc6112feSHong Zhang 2269bc6112feSHong Zhang PetscFunctionBegin; 2270bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2271bc6112feSHong Zhang PetscValidIntPointer(ival,3); 2272bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2273bc6112feSHong Zhang PetscFunctionReturn(0); 2274bc6112feSHong Zhang } 2275bc6112feSHong Zhang 22768928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 22778928b65cSHong Zhang #undef __FUNCT__ 22788928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 22798928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 22808928b65cSHong Zhang { 22818928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 22828928b65cSHong Zhang 22838928b65cSHong Zhang PetscFunctionBegin; 22848928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 22858928b65cSHong Zhang PetscFunctionReturn(0); 22868928b65cSHong Zhang } 22878928b65cSHong Zhang 22888928b65cSHong Zhang #undef __FUNCT__ 2289bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl_MUMPS" 2290bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 2291bc6112feSHong Zhang { 2292bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2293bc6112feSHong Zhang 2294bc6112feSHong Zhang PetscFunctionBegin; 2295bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 2296bc6112feSHong Zhang PetscFunctionReturn(0); 2297bc6112feSHong Zhang } 2298bc6112feSHong Zhang 2299bc6112feSHong Zhang #undef __FUNCT__ 23008928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 23018928b65cSHong Zhang /*@ 23028928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 23038928b65cSHong Zhang 23048928b65cSHong Zhang Logically Collective on Mat 23058928b65cSHong Zhang 23068928b65cSHong Zhang Input Parameters: 23078928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 23088928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 23098928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 23108928b65cSHong Zhang 23118928b65cSHong Zhang Options Database: 23128928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 23138928b65cSHong Zhang 23148928b65cSHong Zhang Level: beginner 23158928b65cSHong Zhang 23168928b65cSHong Zhang References: MUMPS Users' Guide 23178928b65cSHong Zhang 23188928b65cSHong Zhang .seealso: MatGetFactor() 23198928b65cSHong Zhang @*/ 23208928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 23218928b65cSHong Zhang { 23228928b65cSHong Zhang PetscErrorCode ierr; 23238928b65cSHong Zhang 23248928b65cSHong Zhang PetscFunctionBegin; 23258928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2326bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 23278928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 23288928b65cSHong Zhang PetscFunctionReturn(0); 23298928b65cSHong Zhang } 23308928b65cSHong Zhang 2331bc6112feSHong Zhang #undef __FUNCT__ 2332bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 2333a21f80fcSHong Zhang /*@ 2334a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 2335a21f80fcSHong Zhang 2336a21f80fcSHong Zhang Logically Collective on Mat 2337a21f80fcSHong Zhang 2338a21f80fcSHong Zhang Input Parameters: 2339a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2340a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 2341a21f80fcSHong Zhang 2342a21f80fcSHong Zhang Output Parameter: 2343a21f80fcSHong Zhang . val - value of MUMPS CNTL(icntl) 2344a21f80fcSHong Zhang 2345a21f80fcSHong Zhang Level: beginner 2346a21f80fcSHong Zhang 2347a21f80fcSHong Zhang References: MUMPS Users' Guide 2348a21f80fcSHong Zhang 2349a21f80fcSHong Zhang .seealso: MatGetFactor() 2350a21f80fcSHong Zhang @*/ 2351bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 2352bc6112feSHong Zhang { 2353bc6112feSHong Zhang PetscErrorCode ierr; 2354bc6112feSHong Zhang 2355bc6112feSHong Zhang PetscFunctionBegin; 2356bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2357bc6112feSHong Zhang PetscValidRealPointer(val,3); 2358bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2359bc6112feSHong Zhang PetscFunctionReturn(0); 2360bc6112feSHong Zhang } 2361bc6112feSHong Zhang 2362bc6112feSHong Zhang #undef __FUNCT__ 2363ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 2364ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 2365bc6112feSHong Zhang { 2366bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2367bc6112feSHong Zhang 2368bc6112feSHong Zhang PetscFunctionBegin; 2369bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 2370bc6112feSHong Zhang PetscFunctionReturn(0); 2371bc6112feSHong Zhang } 2372bc6112feSHong Zhang 2373bc6112feSHong Zhang #undef __FUNCT__ 2374ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 2375ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 2376bc6112feSHong Zhang { 2377bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2378bc6112feSHong Zhang 2379bc6112feSHong Zhang PetscFunctionBegin; 2380bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 2381bc6112feSHong Zhang PetscFunctionReturn(0); 2382bc6112feSHong Zhang } 2383bc6112feSHong Zhang 2384bc6112feSHong Zhang #undef __FUNCT__ 2385ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo_MUMPS" 2386ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 2387bc6112feSHong Zhang { 2388bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2389bc6112feSHong Zhang 2390bc6112feSHong Zhang PetscFunctionBegin; 2391bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 2392bc6112feSHong Zhang PetscFunctionReturn(0); 2393bc6112feSHong Zhang } 2394bc6112feSHong Zhang 2395bc6112feSHong Zhang #undef __FUNCT__ 2396ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 2397ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 2398bc6112feSHong Zhang { 2399bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2400bc6112feSHong Zhang 2401bc6112feSHong Zhang PetscFunctionBegin; 2402bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 2403bc6112feSHong Zhang PetscFunctionReturn(0); 2404bc6112feSHong Zhang } 2405bc6112feSHong Zhang 2406bc6112feSHong Zhang #undef __FUNCT__ 2407ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 2408a21f80fcSHong Zhang /*@ 2409a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 2410a21f80fcSHong Zhang 2411a21f80fcSHong Zhang Logically Collective on Mat 2412a21f80fcSHong Zhang 2413a21f80fcSHong Zhang Input Parameters: 2414a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2415a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 2416a21f80fcSHong Zhang 2417a21f80fcSHong Zhang Output Parameter: 2418a21f80fcSHong Zhang . ival - value of MUMPS INFO(icntl) 2419a21f80fcSHong Zhang 2420a21f80fcSHong Zhang Level: beginner 2421a21f80fcSHong Zhang 2422a21f80fcSHong Zhang References: MUMPS Users' Guide 2423a21f80fcSHong Zhang 2424a21f80fcSHong Zhang .seealso: MatGetFactor() 2425a21f80fcSHong Zhang @*/ 2426ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 2427bc6112feSHong Zhang { 2428bc6112feSHong Zhang PetscErrorCode ierr; 2429bc6112feSHong Zhang 2430bc6112feSHong Zhang PetscFunctionBegin; 2431ca810319SHong Zhang PetscValidIntPointer(ival,3); 2432ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2433bc6112feSHong Zhang PetscFunctionReturn(0); 2434bc6112feSHong Zhang } 2435bc6112feSHong Zhang 2436bc6112feSHong Zhang #undef __FUNCT__ 2437ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 2438a21f80fcSHong Zhang /*@ 2439a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 2440a21f80fcSHong Zhang 2441a21f80fcSHong Zhang Logically Collective on Mat 2442a21f80fcSHong Zhang 2443a21f80fcSHong Zhang Input Parameters: 2444a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2445a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 2446a21f80fcSHong Zhang 2447a21f80fcSHong Zhang Output Parameter: 2448a21f80fcSHong Zhang . ival - value of MUMPS INFOG(icntl) 2449a21f80fcSHong Zhang 2450a21f80fcSHong Zhang Level: beginner 2451a21f80fcSHong Zhang 2452a21f80fcSHong Zhang References: MUMPS Users' Guide 2453a21f80fcSHong Zhang 2454a21f80fcSHong Zhang .seealso: MatGetFactor() 2455a21f80fcSHong Zhang @*/ 2456ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 2457bc6112feSHong Zhang { 2458bc6112feSHong Zhang PetscErrorCode ierr; 2459bc6112feSHong Zhang 2460bc6112feSHong Zhang PetscFunctionBegin; 2461ca810319SHong Zhang PetscValidIntPointer(ival,3); 2462ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2463bc6112feSHong Zhang PetscFunctionReturn(0); 2464bc6112feSHong Zhang } 2465bc6112feSHong Zhang 2466bc6112feSHong Zhang #undef __FUNCT__ 2467ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 2468a21f80fcSHong Zhang /*@ 2469a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 2470a21f80fcSHong Zhang 2471a21f80fcSHong Zhang Logically Collective on Mat 2472a21f80fcSHong Zhang 2473a21f80fcSHong Zhang Input Parameters: 2474a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2475a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 2476a21f80fcSHong Zhang 2477a21f80fcSHong Zhang Output Parameter: 2478a21f80fcSHong Zhang . val - value of MUMPS RINFO(icntl) 2479a21f80fcSHong Zhang 2480a21f80fcSHong Zhang Level: beginner 2481a21f80fcSHong Zhang 2482a21f80fcSHong Zhang References: MUMPS Users' Guide 2483a21f80fcSHong Zhang 2484a21f80fcSHong Zhang .seealso: MatGetFactor() 2485a21f80fcSHong Zhang @*/ 2486ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 2487bc6112feSHong Zhang { 2488bc6112feSHong Zhang PetscErrorCode ierr; 2489bc6112feSHong Zhang 2490bc6112feSHong Zhang PetscFunctionBegin; 2491bc6112feSHong Zhang PetscValidRealPointer(val,3); 2492ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2493bc6112feSHong Zhang PetscFunctionReturn(0); 2494bc6112feSHong Zhang } 2495bc6112feSHong Zhang 2496bc6112feSHong Zhang #undef __FUNCT__ 2497ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 2498a21f80fcSHong Zhang /*@ 2499a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 2500a21f80fcSHong Zhang 2501a21f80fcSHong Zhang Logically Collective on Mat 2502a21f80fcSHong Zhang 2503a21f80fcSHong Zhang Input Parameters: 2504a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2505a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 2506a21f80fcSHong Zhang 2507a21f80fcSHong Zhang Output Parameter: 2508a21f80fcSHong Zhang . val - value of MUMPS RINFOG(icntl) 2509a21f80fcSHong Zhang 2510a21f80fcSHong Zhang Level: beginner 2511a21f80fcSHong Zhang 2512a21f80fcSHong Zhang References: MUMPS Users' Guide 2513a21f80fcSHong Zhang 2514a21f80fcSHong Zhang .seealso: MatGetFactor() 2515a21f80fcSHong Zhang @*/ 2516ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 2517bc6112feSHong Zhang { 2518bc6112feSHong Zhang PetscErrorCode ierr; 2519bc6112feSHong Zhang 2520bc6112feSHong Zhang PetscFunctionBegin; 2521bc6112feSHong Zhang PetscValidRealPointer(val,3); 2522ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2523bc6112feSHong Zhang PetscFunctionReturn(0); 2524bc6112feSHong Zhang } 2525bc6112feSHong Zhang 252624b6179bSKris Buschelman /*MC 25272692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 252824b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 252924b6179bSKris Buschelman 253041c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 253124b6179bSKris Buschelman 2532c2b89b5dSBarry Smith Use ./configure --download-mumps --download-scalapack --download-parmetis --download-metis --download-ptscotch to have PETSc installed with MUMPS 2533c2b89b5dSBarry Smith 2534c2b89b5dSBarry Smith Use -pc_type cholesky or lu -pc_factor_mat_solver_package mumps to us this direct solver 2535c2b89b5dSBarry Smith 253624b6179bSKris Buschelman Options Database Keys: 25374e34a73bSHong Zhang + -mat_mumps_icntl_1 <6>: ICNTL(1): output stream for error messages (None) 25384e34a73bSHong Zhang . -mat_mumps_icntl_2 <0>: ICNTL(2): output stream for diagnostic printing, statistics, and warning (None) 25394e34a73bSHong Zhang . -mat_mumps_icntl_3 <0>: ICNTL(3): output stream for global information, collected on the host (None) 25404e34a73bSHong Zhang . -mat_mumps_icntl_4 <0>: ICNTL(4): level of printing (0 to 4) (None) 25414e34a73bSHong Zhang . -mat_mumps_icntl_6 <7>: ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) (None) 25424e34a73bSHong Zhang . -mat_mumps_icntl_7 <7>: ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis (None) 25434e34a73bSHong Zhang . -mat_mumps_icntl_8 <77>: ICNTL(8): scaling strategy (-2 to 8 or 77) (None) 25444e34a73bSHong Zhang . -mat_mumps_icntl_10 <0>: ICNTL(10): max num of refinements (None) 25454e34a73bSHong Zhang . -mat_mumps_icntl_11 <0>: ICNTL(11): statistics related to an error analysis (via -ksp_view) (None) 25464e34a73bSHong Zhang . -mat_mumps_icntl_12 <1>: ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) (None) 25474e34a73bSHong Zhang . -mat_mumps_icntl_13 <0>: ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting (None) 25484e34a73bSHong Zhang . -mat_mumps_icntl_14 <20>: ICNTL(14): percentage increase in the estimated working space (None) 25494e34a73bSHong Zhang . -mat_mumps_icntl_19 <0>: ICNTL(19): computes the Schur complement (None) 25504e34a73bSHong Zhang . -mat_mumps_icntl_22 <0>: ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) (None) 25514e34a73bSHong Zhang . -mat_mumps_icntl_23 <0>: ICNTL(23): max size of the working memory (MB) that can allocate per processor (None) 25524e34a73bSHong Zhang . -mat_mumps_icntl_24 <0>: ICNTL(24): detection of null pivot rows (0 or 1) (None) 25534e34a73bSHong Zhang . -mat_mumps_icntl_25 <0>: ICNTL(25): compute a solution of a deficient matrix and a null space basis (None) 25544e34a73bSHong Zhang . -mat_mumps_icntl_26 <0>: ICNTL(26): drives the solution phase if a Schur complement matrix (None) 25554e34a73bSHong Zhang . -mat_mumps_icntl_28 <1>: ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering (None) 25564e34a73bSHong Zhang . -mat_mumps_icntl_29 <0>: ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis (None) 25574e34a73bSHong Zhang . -mat_mumps_icntl_30 <0>: ICNTL(30): compute user-specified set of entries in inv(A) (None) 25584e34a73bSHong Zhang . -mat_mumps_icntl_31 <0>: ICNTL(31): indicates which factors may be discarded during factorization (None) 25594e34a73bSHong Zhang . -mat_mumps_icntl_33 <0>: ICNTL(33): compute determinant (None) 25604e34a73bSHong Zhang . -mat_mumps_cntl_1 <0.01>: CNTL(1): relative pivoting threshold (None) 25614e34a73bSHong Zhang . -mat_mumps_cntl_2 <1.49012e-08>: CNTL(2): stopping criterion of refinement (None) 25624e34a73bSHong Zhang . -mat_mumps_cntl_3 <0>: CNTL(3): absolute pivoting threshold (None) 25634e34a73bSHong Zhang . -mat_mumps_cntl_4 <-1>: CNTL(4): value for static pivoting (None) 25644e34a73bSHong Zhang - -mat_mumps_cntl_5 <0>: CNTL(5): fixation for null pivots (None) 256524b6179bSKris Buschelman 256624b6179bSKris Buschelman Level: beginner 256724b6179bSKris Buschelman 256841c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 256941c8de11SBarry Smith 257024b6179bSKris Buschelman M*/ 257124b6179bSKris Buschelman 257235bd34faSBarry Smith #undef __FUNCT__ 257335bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 2574f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 257535bd34faSBarry Smith { 257635bd34faSBarry Smith PetscFunctionBegin; 25772692d6eeSBarry Smith *type = MATSOLVERMUMPS; 257835bd34faSBarry Smith PetscFunctionReturn(0); 257935bd34faSBarry Smith } 258035bd34faSBarry Smith 2581bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 25822877fffaSHong Zhang #undef __FUNCT__ 2583bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 25848cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 25852877fffaSHong Zhang { 25862877fffaSHong Zhang Mat B; 25872877fffaSHong Zhang PetscErrorCode ierr; 25882877fffaSHong Zhang Mat_MUMPS *mumps; 2589ace3abfcSBarry Smith PetscBool isSeqAIJ; 25902877fffaSHong Zhang 25912877fffaSHong Zhang PetscFunctionBegin; 25922877fffaSHong Zhang /* Create the factorization matrix */ 2593251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 2594ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 25952877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 25962877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2597bccb9932SShri Abhyankar if (isSeqAIJ) { 25980298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 2599bccb9932SShri Abhyankar } else { 26000298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 2601bccb9932SShri Abhyankar } 26022877fffaSHong Zhang 2603b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 26042205254eSKarl Rupp 26052877fffaSHong Zhang B->ops->view = MatView_MUMPS; 260635bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 260720be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 26082205254eSKarl Rupp 2609bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2610bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2611bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2612bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2613bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2614bc6112feSHong Zhang 2615ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2616ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2617ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2618ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 26196444a565SStefano Zampini 26206444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 262159ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 262259ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 26236444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 262459ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2625e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 26267404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2627e807eca7SStefano Zampini 2628450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2629450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 2630d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 2631bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 2632bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 2633746480a1SHong Zhang mumps->sym = 0; 2634dcd589f8SShri Abhyankar } else { 263567877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2636450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 2637bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 2638bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 263959ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 264059ac8732SStefano Zampini mumps->sym = 2; 264159ac8732SStefano Zampini #else 26426fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 26436fdc2a6dSBarry Smith else mumps->sym = 2; 264459ac8732SStefano Zampini #endif 2645450b117fSShri Abhyankar } 26462877fffaSHong Zhang 26472877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 2648bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 26492877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 26502877fffaSHong Zhang B->spptr = (void*)mumps; 26512205254eSKarl Rupp 2652f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2653746480a1SHong Zhang 26542877fffaSHong Zhang *F = B; 26552877fffaSHong Zhang PetscFunctionReturn(0); 26562877fffaSHong Zhang } 26572877fffaSHong Zhang 2658bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 26592877fffaSHong Zhang #undef __FUNCT__ 2660bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 26618cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 26622877fffaSHong Zhang { 26632877fffaSHong Zhang Mat B; 26642877fffaSHong Zhang PetscErrorCode ierr; 26652877fffaSHong Zhang Mat_MUMPS *mumps; 2666ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 26672877fffaSHong Zhang 26682877fffaSHong Zhang PetscFunctionBegin; 2669ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 2670ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 2671251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 26722877fffaSHong Zhang /* Create the factorization matrix */ 2673ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 26742877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 26752877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2676b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2677bccb9932SShri Abhyankar if (isSeqSBAIJ) { 26780298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 26792205254eSKarl Rupp 268016ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 2681dcd589f8SShri Abhyankar } else { 26820298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 26832205254eSKarl Rupp 2684bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 2685bccb9932SShri Abhyankar } 2686bccb9932SShri Abhyankar 268767877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2688bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 268920be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 26902205254eSKarl Rupp 2691bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2692b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2693b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2694b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2695b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2696bc6112feSHong Zhang 2697ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2698ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2699ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2700ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 27012205254eSKarl Rupp 27026444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 270359ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 270459ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27056444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 270659ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2707e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 27087404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 27096444a565SStefano Zampini 2710f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 271159ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 271259ac8732SStefano Zampini mumps->sym = 2; 271359ac8732SStefano Zampini #else 27146fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 27156fdc2a6dSBarry Smith else mumps->sym = 2; 271659ac8732SStefano Zampini #endif 2717a214ac2aSShri Abhyankar 2718bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 2719bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2720f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 27212877fffaSHong Zhang B->spptr = (void*)mumps; 27222205254eSKarl Rupp 2723f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2724746480a1SHong Zhang 27252877fffaSHong Zhang *F = B; 27262877fffaSHong Zhang PetscFunctionReturn(0); 27272877fffaSHong Zhang } 272897969023SHong Zhang 2729450b117fSShri Abhyankar #undef __FUNCT__ 2730bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 27318cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 273267877ebaSShri Abhyankar { 273367877ebaSShri Abhyankar Mat B; 273467877ebaSShri Abhyankar PetscErrorCode ierr; 273567877ebaSShri Abhyankar Mat_MUMPS *mumps; 2736ace3abfcSBarry Smith PetscBool isSeqBAIJ; 273767877ebaSShri Abhyankar 273867877ebaSShri Abhyankar PetscFunctionBegin; 273967877ebaSShri Abhyankar /* Create the factorization matrix */ 2740251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 2741ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 274267877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 274367877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2744bccb9932SShri Abhyankar if (isSeqBAIJ) { 27450298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 2746bccb9932SShri Abhyankar } else { 27470298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 2748bccb9932SShri Abhyankar } 2749450b117fSShri Abhyankar 2750b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2751450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2752450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 2753450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 2754bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 2755bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 2756746480a1SHong Zhang mumps->sym = 0; 2757f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 2758bccb9932SShri Abhyankar 2759450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 276020be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 27612205254eSKarl Rupp 2762bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2763bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2764bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2765bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2766bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2767bc6112feSHong Zhang 2768ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2769ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2770ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2771ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2772450b117fSShri Abhyankar 27736444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 277459ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 277559ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27766444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 277759ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2778e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 27797404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 27806444a565SStefano Zampini 2781450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2782bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2783450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2784450b117fSShri Abhyankar B->spptr = (void*)mumps; 27852205254eSKarl Rupp 2786f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2787746480a1SHong Zhang 2788450b117fSShri Abhyankar *F = B; 2789450b117fSShri Abhyankar PetscFunctionReturn(0); 2790450b117fSShri Abhyankar } 279142c9c57cSBarry Smith 279242c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 279342c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat,MatFactorType,Mat*); 279442c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat,MatFactorType,Mat*); 279542c9c57cSBarry Smith 279642c9c57cSBarry Smith #undef __FUNCT__ 279742c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 279829b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 279942c9c57cSBarry Smith { 280042c9c57cSBarry Smith PetscErrorCode ierr; 280142c9c57cSBarry Smith 280242c9c57cSBarry Smith PetscFunctionBegin; 280342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 280442c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 280542c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 280642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 280742c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 280842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 280942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 281042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 281142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 281242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 281342c9c57cSBarry Smith PetscFunctionReturn(0); 281442c9c57cSBarry Smith } 281542c9c57cSBarry Smith 2816