11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8b5fa320bSStefano Zampini #include <petscblaslapack.h> 9397b6df1SKris Buschelman 10397b6df1SKris Buschelman EXTERN_C_BEGIN 11397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 122907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 132907cef9SHong Zhang #include <cmumps_c.h> 142907cef9SHong Zhang #else 15c6db04a5SJed Brown #include <zmumps_c.h> 162907cef9SHong Zhang #endif 172907cef9SHong Zhang #else 182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 192907cef9SHong Zhang #include <smumps_c.h> 20397b6df1SKris Buschelman #else 21c6db04a5SJed Brown #include <dmumps_c.h> 22397b6df1SKris Buschelman #endif 232907cef9SHong Zhang #endif 24397b6df1SKris Buschelman EXTERN_C_END 25397b6df1SKris Buschelman #define JOB_INIT -1 263d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 273d472b54SHong Zhang #define JOB_FACTNUMERIC 2 283d472b54SHong Zhang #define JOB_SOLVE 3 29397b6df1SKris Buschelman #define JOB_END -2 303d472b54SHong Zhang 312907cef9SHong Zhang /* calls to MUMPS */ 322907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 332907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 342907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 352907cef9SHong Zhang #else 362907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 372907cef9SHong Zhang #endif 382907cef9SHong Zhang #else 392907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 402907cef9SHong Zhang #define PetscMUMPS_c smumps_c 412907cef9SHong Zhang #else 422907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 432907cef9SHong Zhang #endif 442907cef9SHong Zhang #endif 452907cef9SHong Zhang 46940cd9d6SSatish Balay /* declare MumpsScalar */ 47940cd9d6SSatish Balay #if defined(PETSC_USE_COMPLEX) 
48940cd9d6SSatish Balay #if defined(PETSC_USE_REAL_SINGLE) 49940cd9d6SSatish Balay #define MumpsScalar mumps_complex 50940cd9d6SSatish Balay #else 51940cd9d6SSatish Balay #define MumpsScalar mumps_double_complex 52940cd9d6SSatish Balay #endif 53940cd9d6SSatish Balay #else 54940cd9d6SSatish Balay #define MumpsScalar PetscScalar 55940cd9d6SSatish Balay #endif 563d472b54SHong Zhang 57397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 58397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 59397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 60397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 61a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 62397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 63adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 64397b6df1SKris Buschelman 65397b6df1SKris Buschelman typedef struct { 66397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 672907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 682907cef9SHong Zhang CMUMPS_STRUC_C id; 692907cef9SHong Zhang #else 70397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 712907cef9SHong Zhang #endif 722907cef9SHong Zhang #else 732907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 742907cef9SHong Zhang SMUMPS_STRUC_C id; 75397b6df1SKris Buschelman #else 76397b6df1SKris Buschelman DMUMPS_STRUC_C id; 77397b6df1SKris Buschelman #endif 782907cef9SHong Zhang #endif 792907cef9SHong Zhang 80397b6df1SKris Buschelman MatStructure matstruc; 81c1490034SHong Zhang PetscMPIInt myid,size; 82a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 83397b6df1SKris Buschelman PetscScalar *val; 84397b6df1SKris Buschelman MPI_Comm comm_mumps; 856f3cc6f9SBarry Smith PetscBool isAIJ; 86a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 87801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 88801fbe65SHong Zhang Vec b_seq,x_seq; 89b34f08ffSHong Zhang PetscInt ninfo,*info; /* display INFO */ 90b5fa320bSStefano Zampini 
PetscBool schur_second_solve; 91b5fa320bSStefano Zampini PetscInt sizeredrhs; 92b5fa320bSStefano Zampini PetscInt *schur_pivots; 9359ac8732SStefano Zampini PetscInt schur_B_lwork; 94b5fa320bSStefano Zampini PetscScalar *schur_work; 9559ac8732SStefano Zampini PetscScalar *schur_sol; 9659ac8732SStefano Zampini PetscInt schur_sizesol; 9759ac8732SStefano Zampini PetscBool schur_restored; 9859ac8732SStefano Zampini PetscBool schur_factored; 9959ac8732SStefano Zampini PetscBool schur_inverted; 1002205254eSKarl Rupp 101bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 102bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 103f0c56d0fSKris Buschelman } Mat_MUMPS; 104f0c56d0fSKris Buschelman 10509573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 106b24902e0SBarry Smith 10759ac8732SStefano Zampini #undef __FUNCT__ 10859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsResetSchur_Private" 10959ac8732SStefano Zampini static PetscErrorCode MatMumpsResetSchur_Private(Mat_MUMPS* mumps) 110b5fa320bSStefano Zampini { 111b5fa320bSStefano Zampini PetscErrorCode ierr; 112b5fa320bSStefano Zampini 113b5fa320bSStefano Zampini PetscFunctionBegin; 11459ac8732SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 11559ac8732SStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 11659ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 11759ac8732SStefano Zampini ierr = PetscFree(mumps->schur_pivots);CHKERRQ(ierr); 11859ac8732SStefano Zampini ierr = PetscFree(mumps->schur_work);CHKERRQ(ierr); 119*6c4ed002SBarry Smith if (!mumps->schur_restored) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 12059ac8732SStefano Zampini mumps->id.size_schur = 0; 12159ac8732SStefano Zampini mumps->id.ICNTL(19) = 0; 12259ac8732SStefano Zampini PetscFunctionReturn(0); 
12359ac8732SStefano Zampini } 12459ac8732SStefano Zampini 12559ac8732SStefano Zampini #undef __FUNCT__ 12659ac8732SStefano Zampini #define __FUNCT__ "MatMumpsFactorSchur_Private" 12759ac8732SStefano Zampini static PetscErrorCode MatMumpsFactorSchur_Private(Mat_MUMPS* mumps) 12859ac8732SStefano Zampini { 12959ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 13059ac8732SStefano Zampini PetscErrorCode ierr; 13159ac8732SStefano Zampini 13259ac8732SStefano Zampini PetscFunctionBegin; 13359ac8732SStefano Zampini if (mumps->schur_factored) { 13459ac8732SStefano Zampini PetscFunctionReturn(0); 13559ac8732SStefano Zampini } 13659ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 13759ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 13859ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 13959ac8732SStefano Zampini if (!mumps->schur_pivots) { 14059ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 14159ac8732SStefano Zampini } 14259ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 14359ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&B_N,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&B_ierr)); 14459ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 14559ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRF Lapack routine %d",(int)B_ierr); 14659ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 14759ac8732SStefano Zampini char ord[2]; 14859ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 14959ac8732SStefano Zampini sprintf(ord,"L"); 15059ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 15159ac8732SStefano Zampini sprintf(ord,"U"); 15259ac8732SStefano 
Zampini } 15359ac8732SStefano Zampini if (mumps->id.sym == 2) { 15459ac8732SStefano Zampini if (!mumps->schur_pivots) { 15559ac8732SStefano Zampini PetscScalar lwork; 15659ac8732SStefano Zampini 15759ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 15859ac8732SStefano Zampini mumps->schur_B_lwork=-1; 15959ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 16159ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 16259ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYTRF Lapack routine %d",(int)B_ierr); 16359ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 16459ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 16559ac8732SStefano Zampini } 16659ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16759ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 16859ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 16959ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRF Lapack routine %d",(int)B_ierr); 17059ac8732SStefano Zampini } else { 17159ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 17259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,&B_ierr)); 17359ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17459ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRF Lapack routine %d",(int)B_ierr); 
17559ac8732SStefano Zampini } 17659ac8732SStefano Zampini } 17759ac8732SStefano Zampini mumps->schur_factored = PETSC_TRUE; 17859ac8732SStefano Zampini PetscFunctionReturn(0); 17959ac8732SStefano Zampini } 18059ac8732SStefano Zampini 18159ac8732SStefano Zampini #undef __FUNCT__ 18259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchur_Private" 18359ac8732SStefano Zampini static PetscErrorCode MatMumpsInvertSchur_Private(Mat_MUMPS* mumps) 18459ac8732SStefano Zampini { 18559ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 18659ac8732SStefano Zampini PetscErrorCode ierr; 18759ac8732SStefano Zampini 18859ac8732SStefano Zampini PetscFunctionBegin; 18959ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 19059ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 19159ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 19259ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 19359ac8732SStefano Zampini if (!mumps->schur_work) { 19459ac8732SStefano Zampini PetscScalar lwork; 19559ac8732SStefano Zampini 19659ac8732SStefano Zampini mumps->schur_B_lwork = -1; 19759ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 19859ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 19959ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20059ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GETRI Lapack routine %d",(int)B_ierr); 20159ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 20259ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 20359ac8732SStefano Zampini } 20459ac8732SStefano Zampini ierr = 
PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20559ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 20659ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20759ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRI Lapack routine %d",(int)B_ierr); 20859ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 20959ac8732SStefano Zampini char ord[2]; 21059ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 21159ac8732SStefano Zampini sprintf(ord,"L"); 21259ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 21359ac8732SStefano Zampini sprintf(ord,"U"); 21459ac8732SStefano Zampini } 21559ac8732SStefano Zampini if (mumps->id.sym == 2) { 21659ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21759ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&B_ierr)); 21859ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 21959ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRI Lapack routine %d",(int)B_ierr); 22059ac8732SStefano Zampini } else { 22159ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,&B_ierr)); 22359ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22459ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRI Lapack routine %d",(int)B_ierr); 22559ac8732SStefano Zampini } 22659ac8732SStefano Zampini } 22759ac8732SStefano Zampini mumps->schur_inverted = PETSC_TRUE; 
22859ac8732SStefano Zampini PetscFunctionReturn(0); 22959ac8732SStefano Zampini } 23059ac8732SStefano Zampini 23159ac8732SStefano Zampini #undef __FUNCT__ 23259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchur_Private" 233e807eca7SStefano Zampini static PetscErrorCode MatMumpsSolveSchur_Private(Mat_MUMPS* mumps, PetscBool sol_in_redrhs) 23459ac8732SStefano Zampini { 23559ac8732SStefano Zampini PetscBLASInt B_N,B_Nrhs,B_ierr,B_slda,B_rlda; 23659ac8732SStefano Zampini PetscScalar one=1.,zero=0.; 23759ac8732SStefano Zampini PetscErrorCode ierr; 23859ac8732SStefano Zampini 23959ac8732SStefano Zampini PetscFunctionBegin; 24059ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 241b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 242b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 243b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.nrhs,&B_Nrhs);CHKERRQ(ierr); 244b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.lredrhs,&B_rlda);CHKERRQ(ierr); 24559ac8732SStefano Zampini if (mumps->schur_inverted) { 24659ac8732SStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 24759ac8732SStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 24859ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 24959ac8732SStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 25059ac8732SStefano Zampini mumps->schur_sizesol = sizesol; 251b5fa320bSStefano Zampini } 25259ac8732SStefano Zampini if (!mumps->sym) { 25359ac8732SStefano Zampini char type[2]; 254b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 25559ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25659ac8732SStefano Zampini sprintf(type,"N"); 257b5fa320bSStefano Zampini } else { 25859ac8732SStefano Zampini sprintf(type,"T"); 259b5fa320bSStefano Zampini } 26059ac8732SStefano Zampini } else 
{ /* stored by columns */ 26159ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 26259ac8732SStefano Zampini sprintf(type,"T"); 26359ac8732SStefano Zampini } else { 26459ac8732SStefano Zampini sprintf(type,"N"); 26559ac8732SStefano Zampini } 26659ac8732SStefano Zampini } 26759ac8732SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_(type,"N",&B_N,&B_Nrhs,&B_N,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 26859ac8732SStefano Zampini } else { 26959ac8732SStefano Zampini char ord[2]; 27059ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 27159ac8732SStefano Zampini sprintf(ord,"L"); 27259ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 27359ac8732SStefano Zampini sprintf(ord,"U"); 27459ac8732SStefano Zampini } 27559ac8732SStefano Zampini PetscStackCallBLAS("BLASsymm",BLASsymm_("L",ord,&B_N,&B_Nrhs,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27659ac8732SStefano Zampini } 277e807eca7SStefano Zampini if (sol_in_redrhs) { 27859ac8732SStefano Zampini ierr = PetscMemcpy(mumps->id.redrhs,mumps->schur_sol,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 279e807eca7SStefano Zampini } 280a12f35bfSStefano Zampini } else { /* Schur complement has not been inverted */ 281a12f35bfSStefano Zampini MumpsScalar *orhs=NULL; 282a12f35bfSStefano Zampini 283a12f35bfSStefano Zampini if (!sol_in_redrhs) { 284a12f35bfSStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 285a12f35bfSStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 286a12f35bfSStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 287a12f35bfSStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 288a12f35bfSStefano Zampini mumps->schur_sizesol = sizesol; 289a12f35bfSStefano Zampini } 
290a12f35bfSStefano Zampini orhs = mumps->id.redrhs; 291a12f35bfSStefano Zampini ierr = PetscMemcpy(mumps->schur_sol,mumps->id.redrhs,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 292a12f35bfSStefano Zampini mumps->id.redrhs = (MumpsScalar*)mumps->schur_sol; 293a12f35bfSStefano Zampini } 29459ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 29559ac8732SStefano Zampini char type[2]; 29659ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 29759ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 29859ac8732SStefano Zampini sprintf(type,"N"); 29959ac8732SStefano Zampini } else { 30059ac8732SStefano Zampini sprintf(type,"T"); 30159ac8732SStefano Zampini } 30259ac8732SStefano Zampini } else { /* stored by columns */ 30359ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30459ac8732SStefano Zampini sprintf(type,"T"); 30559ac8732SStefano Zampini } else { 30659ac8732SStefano Zampini sprintf(type,"N"); 30759ac8732SStefano Zampini } 30859ac8732SStefano Zampini } 30959ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 31059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_(type,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 311b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 312b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRS Lapack routine %d",(int)B_ierr); 313b5fa320bSStefano Zampini } else { /* either full or lower-triangular (not packed) */ 314b5fa320bSStefano Zampini char ord[2]; 315b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 316b5fa320bSStefano Zampini sprintf(ord,"L"); 317b5fa320bSStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 318b5fa320bSStefano Zampini 
sprintf(ord,"U"); 319b5fa320bSStefano Zampini } 320b5fa320bSStefano Zampini if (mumps->id.sym == 2) { 321b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 323b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 324b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRS Lapack routine %d",(int)B_ierr); 325b5fa320bSStefano Zampini } else { 326b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32759ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 328b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 329b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRS Lapack routine %d",(int)B_ierr); 330b5fa320bSStefano Zampini } 331b5fa320bSStefano Zampini } 332e807eca7SStefano Zampini if (!sol_in_redrhs) { 333a12f35bfSStefano Zampini mumps->id.redrhs = orhs; 334e807eca7SStefano Zampini } 33559ac8732SStefano Zampini } 336b5fa320bSStefano Zampini PetscFunctionReturn(0); 337b5fa320bSStefano Zampini } 338b5fa320bSStefano Zampini 33959ac8732SStefano Zampini #undef __FUNCT__ 34059ac8732SStefano Zampini #define __FUNCT__ "MatMumpsHandleSchur_Private" 341b5fa320bSStefano Zampini static PetscErrorCode MatMumpsHandleSchur_Private(Mat_MUMPS* mumps) 342b5fa320bSStefano Zampini { 343b5fa320bSStefano Zampini PetscErrorCode ierr; 344b5fa320bSStefano Zampini 345b5fa320bSStefano Zampini PetscFunctionBegin; 346b5fa320bSStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing when Schur complement has not been computed */ 347b5fa320bSStefano Zampini PetscFunctionReturn(0); 348b5fa320bSStefano Zampini } 
349b5fa320bSStefano Zampini if (!mumps->schur_second_solve) { /* prepare for the condensation step */ 350b5fa320bSStefano Zampini /* check if schur complement has been computed 351e807eca7SStefano Zampini We set by default ICNTL(26) == -1 when Schur indices have been provided by the user. 352b5fa320bSStefano Zampini According to MUMPS (5.0.0) manual, any value should be harmful during the factorization phase 353b5fa320bSStefano Zampini Unless the user provides a valid value for ICNTL(26), MatSolve and MatMatSolve routines solve the full system. 354b5fa320bSStefano Zampini This requires an extra call to PetscMUMPS_c and the computation of the factors for S, handled setting double_schur_solve to PETSC_TRUE */ 355b5fa320bSStefano Zampini if (mumps->id.ICNTL(26) < 0 || mumps->id.ICNTL(26) > 2) { 356b5fa320bSStefano Zampini PetscInt sizeredrhs = mumps->id.nrhs*mumps->id.size_schur; 357b5fa320bSStefano Zampini /* allocate MUMPS internal array to store reduced right-hand sides */ 358b5fa320bSStefano Zampini if (!mumps->id.redrhs || sizeredrhs > mumps->sizeredrhs) { 359b5fa320bSStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 360b5fa320bSStefano Zampini mumps->id.lredrhs = mumps->id.size_schur; 361b5fa320bSStefano Zampini ierr = PetscMalloc1(mumps->id.nrhs*mumps->id.lredrhs,&mumps->id.redrhs);CHKERRQ(ierr); 362b5fa320bSStefano Zampini mumps->sizeredrhs = mumps->id.nrhs*mumps->id.lredrhs; 363b5fa320bSStefano Zampini } 364b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_TRUE; 365b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 1; /* condensation phase */ 366b5fa320bSStefano Zampini } 367b5fa320bSStefano Zampini } else { /* prepare for the expansion step */ 368b5fa320bSStefano Zampini /* solve Schur complement (this should be done by the MUMPS user, so basically us) */ 369e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 370b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 2; /* expansion phase */ 
371b5fa320bSStefano Zampini PetscMUMPS_c(&mumps->id); 372b5fa320bSStefano Zampini if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 373b5fa320bSStefano Zampini /* restore defaults */ 374b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 375b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 376b5fa320bSStefano Zampini } 377b5fa320bSStefano Zampini PetscFunctionReturn(0); 378b5fa320bSStefano Zampini } 379b5fa320bSStefano Zampini 380397b6df1SKris Buschelman /* 381d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], col[nz], val[nz] 382d341cd04SHong Zhang 383397b6df1SKris Buschelman input: 38467877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 385397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 386bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 387bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 388397b6df1SKris Buschelman output: 389397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 390397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 391eb9baa12SBarry Smith 392eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 393eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 394eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 
395eb9baa12SBarry Smith 396397b6df1SKris Buschelman */ 39716ebf90aSShri Abhyankar 39816ebf90aSShri Abhyankar #undef __FUNCT__ 39916ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 400bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 401b24902e0SBarry Smith { 402185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 40367877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 404dfbe8321SBarry Smith PetscErrorCode ierr; 405c1490034SHong Zhang PetscInt *row,*col; 40616ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 407397b6df1SKris Buschelman 408397b6df1SKris Buschelman PetscFunctionBegin; 40916ebf90aSShri Abhyankar *v=aa->a; 410bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4112205254eSKarl Rupp nz = aa->nz; 4122205254eSKarl Rupp ai = aa->i; 4132205254eSKarl Rupp aj = aa->j; 41416ebf90aSShri Abhyankar *nnz = nz; 415785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 416185f6596SHong Zhang col = row + nz; 417185f6596SHong Zhang 41816ebf90aSShri Abhyankar nz = 0; 41916ebf90aSShri Abhyankar for (i=0; i<M; i++) { 42016ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 42167877ebaSShri Abhyankar ajj = aj + ai[i]; 42267877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 42367877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 42416ebf90aSShri Abhyankar } 42516ebf90aSShri Abhyankar } 42616ebf90aSShri Abhyankar *r = row; *c = col; 42716ebf90aSShri Abhyankar } 42816ebf90aSShri Abhyankar PetscFunctionReturn(0); 42916ebf90aSShri Abhyankar } 430397b6df1SKris Buschelman 43116ebf90aSShri Abhyankar #undef __FUNCT__ 43267877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 433bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 43467877ebaSShri Abhyankar { 43567877ebaSShri Abhyankar Mat_SeqBAIJ 
*aa=(Mat_SeqBAIJ*)A->data; 43633d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 43733d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 43867877ebaSShri Abhyankar PetscErrorCode ierr; 43967877ebaSShri Abhyankar PetscInt *row,*col; 44067877ebaSShri Abhyankar 44167877ebaSShri Abhyankar PetscFunctionBegin; 44233d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 44333d57670SJed Brown M = A->rmap->N/bs; 444cf3759fdSShri Abhyankar *v = aa->a; 445bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 446cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 44767877ebaSShri Abhyankar nz = bs2*aa->nz; 44867877ebaSShri Abhyankar *nnz = nz; 449785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 450185f6596SHong Zhang col = row + nz; 451185f6596SHong Zhang 45267877ebaSShri Abhyankar for (i=0; i<M; i++) { 45367877ebaSShri Abhyankar ajj = aj + ai[i]; 45467877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 45567877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 45667877ebaSShri Abhyankar for (j=0; j<bs; j++) { 45767877ebaSShri Abhyankar for (m=0; m<bs; m++) { 45867877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 459cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 46067877ebaSShri Abhyankar } 46167877ebaSShri Abhyankar } 46267877ebaSShri Abhyankar } 46367877ebaSShri Abhyankar } 464cf3759fdSShri Abhyankar *r = row; *c = col; 46567877ebaSShri Abhyankar } 46667877ebaSShri Abhyankar PetscFunctionReturn(0); 46767877ebaSShri Abhyankar } 46867877ebaSShri Abhyankar 46967877ebaSShri Abhyankar #undef __FUNCT__ 47016ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 471bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 47216ebf90aSShri Abhyankar { 47367877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 47467877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 47516ebf90aSShri Abhyankar PetscErrorCode ierr; 
47616ebf90aSShri Abhyankar PetscInt *row,*col; 47716ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 47816ebf90aSShri Abhyankar 47916ebf90aSShri Abhyankar PetscFunctionBegin; 480882afa5aSHong Zhang *v = aa->a; 481bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4822205254eSKarl Rupp nz = aa->nz; 4832205254eSKarl Rupp ai = aa->i; 4842205254eSKarl Rupp aj = aa->j; 4852205254eSKarl Rupp *v = aa->a; 48616ebf90aSShri Abhyankar *nnz = nz; 487785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 488185f6596SHong Zhang col = row + nz; 489185f6596SHong Zhang 49016ebf90aSShri Abhyankar nz = 0; 49116ebf90aSShri Abhyankar for (i=0; i<M; i++) { 49216ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 49367877ebaSShri Abhyankar ajj = aj + ai[i]; 49467877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 49567877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 49616ebf90aSShri Abhyankar } 49716ebf90aSShri Abhyankar } 49816ebf90aSShri Abhyankar *r = row; *c = col; 49916ebf90aSShri Abhyankar } 50016ebf90aSShri Abhyankar PetscFunctionReturn(0); 50116ebf90aSShri Abhyankar } 50216ebf90aSShri Abhyankar 50316ebf90aSShri Abhyankar #undef __FUNCT__ 50416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 505bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 50616ebf90aSShri Abhyankar { 50767877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 50867877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 50967877ebaSShri Abhyankar const PetscScalar *av,*v1; 51016ebf90aSShri Abhyankar PetscScalar *val; 51116ebf90aSShri Abhyankar PetscErrorCode ierr; 51216ebf90aSShri Abhyankar PetscInt *row,*col; 513829b1710SHong Zhang Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 51416ebf90aSShri Abhyankar 51516ebf90aSShri Abhyankar PetscFunctionBegin; 51616ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 51716ebf90aSShri Abhyankar adiag=aa->diag; 
518bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 519829b1710SHong Zhang /* count nz in the uppper triangular part of A */ 520829b1710SHong Zhang nz = 0; 521829b1710SHong Zhang for (i=0; i<M; i++) nz += ai[i+1] - adiag[i]; 52216ebf90aSShri Abhyankar *nnz = nz; 523829b1710SHong Zhang 524185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 525185f6596SHong Zhang col = row + nz; 526185f6596SHong Zhang val = (PetscScalar*)(col + nz); 527185f6596SHong Zhang 52816ebf90aSShri Abhyankar nz = 0; 52916ebf90aSShri Abhyankar for (i=0; i<M; i++) { 53016ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 53167877ebaSShri Abhyankar ajj = aj + adiag[i]; 532cf3759fdSShri Abhyankar v1 = av + adiag[i]; 53367877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 53467877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 53516ebf90aSShri Abhyankar } 53616ebf90aSShri Abhyankar } 53716ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 538397b6df1SKris Buschelman } else { 53916ebf90aSShri Abhyankar nz = 0; val = *v; 54016ebf90aSShri Abhyankar for (i=0; i <M; i++) { 54116ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 54267877ebaSShri Abhyankar ajj = aj + adiag[i]; 54367877ebaSShri Abhyankar v1 = av + adiag[i]; 54467877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 54567877ebaSShri Abhyankar val[nz++] = v1[j]; 54616ebf90aSShri Abhyankar } 54716ebf90aSShri Abhyankar } 54816ebf90aSShri Abhyankar } 54916ebf90aSShri Abhyankar PetscFunctionReturn(0); 55016ebf90aSShri Abhyankar } 55116ebf90aSShri Abhyankar 55216ebf90aSShri Abhyankar #undef __FUNCT__ 55316ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 554bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 55516ebf90aSShri Abhyankar { 55616ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 
55716ebf90aSShri Abhyankar PetscErrorCode ierr; 55816ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 55916ebf90aSShri Abhyankar PetscInt *row,*col; 56016ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 56116ebf90aSShri Abhyankar PetscScalar *val; 562397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 563397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 564397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 56516ebf90aSShri Abhyankar 56616ebf90aSShri Abhyankar PetscFunctionBegin; 567d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 568397b6df1SKris Buschelman av=aa->a; bv=bb->a; 569397b6df1SKris Buschelman 5702205254eSKarl Rupp garray = mat->garray; 5712205254eSKarl Rupp 572bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 57316ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 57416ebf90aSShri Abhyankar *nnz = nz; 575185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 576185f6596SHong Zhang col = row + nz; 577185f6596SHong Zhang val = (PetscScalar*)(col + nz); 578185f6596SHong Zhang 579397b6df1SKris Buschelman *r = row; *c = col; *v = val; 580397b6df1SKris Buschelman } else { 581397b6df1SKris Buschelman row = *r; col = *c; val = *v; 582397b6df1SKris Buschelman } 583397b6df1SKris Buschelman 584028e57e8SHong Zhang jj = 0; irow = rstart; 585397b6df1SKris Buschelman for (i=0; i<m; i++) { 586397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 587397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 588397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 589397b6df1SKris Buschelman bjj = bj + bi[i]; 59016ebf90aSShri Abhyankar v1 = av + ai[i]; 59116ebf90aSShri Abhyankar v2 = bv + bi[i]; 592397b6df1SKris Buschelman 593397b6df1SKris Buschelman /* A-part */ 594397b6df1SKris Buschelman for (j=0; j<countA; j++) { 595bccb9932SShri Abhyankar if (reuse == 
MAT_INITIAL_MATRIX) { 596397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 597397b6df1SKris Buschelman } 59816ebf90aSShri Abhyankar val[jj++] = v1[j]; 599397b6df1SKris Buschelman } 60016ebf90aSShri Abhyankar 60116ebf90aSShri Abhyankar /* B-part */ 60216ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 603bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 604397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 605397b6df1SKris Buschelman } 60616ebf90aSShri Abhyankar val[jj++] = v2[j]; 60716ebf90aSShri Abhyankar } 60816ebf90aSShri Abhyankar irow++; 60916ebf90aSShri Abhyankar } 61016ebf90aSShri Abhyankar PetscFunctionReturn(0); 61116ebf90aSShri Abhyankar } 61216ebf90aSShri Abhyankar 61316ebf90aSShri Abhyankar #undef __FUNCT__ 61416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 615bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 61616ebf90aSShri Abhyankar { 61716ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 61816ebf90aSShri Abhyankar PetscErrorCode ierr; 61916ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 62016ebf90aSShri Abhyankar PetscInt *row,*col; 62116ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 62216ebf90aSShri Abhyankar PetscScalar *val; 62316ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 62416ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 62516ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 62616ebf90aSShri Abhyankar 62716ebf90aSShri Abhyankar PetscFunctionBegin; 62816ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 62916ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 63016ebf90aSShri Abhyankar 6312205254eSKarl Rupp garray = mat->garray; 6322205254eSKarl Rupp 633bccb9932SShri Abhyankar if (reuse == 
MAT_INITIAL_MATRIX) { 63416ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 63516ebf90aSShri Abhyankar *nnz = nz; 636185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 637185f6596SHong Zhang col = row + nz; 638185f6596SHong Zhang val = (PetscScalar*)(col + nz); 639185f6596SHong Zhang 64016ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 64116ebf90aSShri Abhyankar } else { 64216ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 64316ebf90aSShri Abhyankar } 64416ebf90aSShri Abhyankar 64516ebf90aSShri Abhyankar jj = 0; irow = rstart; 64616ebf90aSShri Abhyankar for (i=0; i<m; i++) { 64716ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 64816ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 64916ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 65016ebf90aSShri Abhyankar bjj = bj + bi[i]; 65116ebf90aSShri Abhyankar v1 = av + ai[i]; 65216ebf90aSShri Abhyankar v2 = bv + bi[i]; 65316ebf90aSShri Abhyankar 65416ebf90aSShri Abhyankar /* A-part */ 65516ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 656bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 65716ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 65816ebf90aSShri Abhyankar } 65916ebf90aSShri Abhyankar val[jj++] = v1[j]; 66016ebf90aSShri Abhyankar } 66116ebf90aSShri Abhyankar 66216ebf90aSShri Abhyankar /* B-part */ 66316ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 664bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 66516ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 66616ebf90aSShri Abhyankar } 66716ebf90aSShri Abhyankar val[jj++] = v2[j]; 66816ebf90aSShri Abhyankar } 66916ebf90aSShri Abhyankar irow++; 67016ebf90aSShri Abhyankar } 67116ebf90aSShri Abhyankar PetscFunctionReturn(0); 67216ebf90aSShri Abhyankar } 67316ebf90aSShri Abhyankar 67416ebf90aSShri Abhyankar #undef __FUNCT__ 67567877ebaSShri Abhyankar #define __FUNCT__ 
"MatConvertToTriples_mpibaij_mpiaij" 676bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 67767877ebaSShri Abhyankar { 67867877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 67967877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 68067877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 68167877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 682d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 68333d57670SJed Brown const PetscInt bs2=mat->bs2; 68467877ebaSShri Abhyankar PetscErrorCode ierr; 68533d57670SJed Brown PetscInt bs,nz,i,j,k,n,jj,irow,countA,countB,idx; 68667877ebaSShri Abhyankar PetscInt *row,*col; 68767877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 68867877ebaSShri Abhyankar PetscScalar *val; 68967877ebaSShri Abhyankar 69067877ebaSShri Abhyankar PetscFunctionBegin; 69133d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 692bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 69367877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 69467877ebaSShri Abhyankar *nnz = nz; 695185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 696185f6596SHong Zhang col = row + nz; 697185f6596SHong Zhang val = (PetscScalar*)(col + nz); 698185f6596SHong Zhang 69967877ebaSShri Abhyankar *r = row; *c = col; *v = val; 70067877ebaSShri Abhyankar } else { 70167877ebaSShri Abhyankar row = *r; col = *c; val = *v; 70267877ebaSShri Abhyankar } 70367877ebaSShri Abhyankar 704d985c460SShri Abhyankar jj = 0; irow = rstart; 70567877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 70667877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 70767877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 70867877ebaSShri Abhyankar ajj = aj + ai[i]; 70967877ebaSShri Abhyankar bjj = bj 
+ bi[i]; 71067877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 71167877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 71267877ebaSShri Abhyankar 71367877ebaSShri Abhyankar idx = 0; 71467877ebaSShri Abhyankar /* A-part */ 71567877ebaSShri Abhyankar for (k=0; k<countA; k++) { 71667877ebaSShri Abhyankar for (j=0; j<bs; j++) { 71767877ebaSShri Abhyankar for (n=0; n<bs; n++) { 718bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 719d985c460SShri Abhyankar row[jj] = irow + n + shift; 720d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 72167877ebaSShri Abhyankar } 72267877ebaSShri Abhyankar val[jj++] = v1[idx++]; 72367877ebaSShri Abhyankar } 72467877ebaSShri Abhyankar } 72567877ebaSShri Abhyankar } 72667877ebaSShri Abhyankar 72767877ebaSShri Abhyankar idx = 0; 72867877ebaSShri Abhyankar /* B-part */ 72967877ebaSShri Abhyankar for (k=0; k<countB; k++) { 73067877ebaSShri Abhyankar for (j=0; j<bs; j++) { 73167877ebaSShri Abhyankar for (n=0; n<bs; n++) { 732bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 733d985c460SShri Abhyankar row[jj] = irow + n + shift; 734d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 73567877ebaSShri Abhyankar } 736d985c460SShri Abhyankar val[jj++] = v2[idx++]; 73767877ebaSShri Abhyankar } 73867877ebaSShri Abhyankar } 73967877ebaSShri Abhyankar } 740d985c460SShri Abhyankar irow += bs; 74167877ebaSShri Abhyankar } 74267877ebaSShri Abhyankar PetscFunctionReturn(0); 74367877ebaSShri Abhyankar } 74467877ebaSShri Abhyankar 74567877ebaSShri Abhyankar #undef __FUNCT__ 74616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 747bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 74816ebf90aSShri Abhyankar { 74916ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 75016ebf90aSShri Abhyankar PetscErrorCode ierr; 751e0bace9bSHong Zhang PetscInt 
rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 75216ebf90aSShri Abhyankar PetscInt *row,*col; 75316ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 75416ebf90aSShri Abhyankar PetscScalar *val; 75516ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 75616ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 75716ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 75816ebf90aSShri Abhyankar 75916ebf90aSShri Abhyankar PetscFunctionBegin; 76016ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 76116ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 76216ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 7632205254eSKarl Rupp 76416ebf90aSShri Abhyankar rstart = A->rmap->rstart; 76516ebf90aSShri Abhyankar 766bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 767e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 768e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 76916ebf90aSShri Abhyankar for (i=0; i<m; i++) { 770e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 77116ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 77216ebf90aSShri Abhyankar bjj = bj + bi[i]; 773e0bace9bSHong Zhang for (j=0; j<countB; j++) { 774e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 775e0bace9bSHong Zhang } 776e0bace9bSHong Zhang } 77716ebf90aSShri Abhyankar 778e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 77916ebf90aSShri Abhyankar *nnz = nz; 780185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 781185f6596SHong Zhang col = row + nz; 782185f6596SHong Zhang val = (PetscScalar*)(col + nz); 783185f6596SHong Zhang 78416ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 78516ebf90aSShri Abhyankar } else { 78616ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 78716ebf90aSShri Abhyankar } 78816ebf90aSShri Abhyankar 78916ebf90aSShri Abhyankar jj = 0; irow = 
rstart; 79016ebf90aSShri Abhyankar for (i=0; i<m; i++) { 79116ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 79216ebf90aSShri Abhyankar v1 = av + adiag[i]; 79316ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 79416ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 79516ebf90aSShri Abhyankar bjj = bj + bi[i]; 79616ebf90aSShri Abhyankar v2 = bv + bi[i]; 79716ebf90aSShri Abhyankar 79816ebf90aSShri Abhyankar /* A-part */ 79916ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 800bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 80116ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 80216ebf90aSShri Abhyankar } 80316ebf90aSShri Abhyankar val[jj++] = v1[j]; 80416ebf90aSShri Abhyankar } 80516ebf90aSShri Abhyankar 80616ebf90aSShri Abhyankar /* B-part */ 80716ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 80816ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 809bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 81016ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 81116ebf90aSShri Abhyankar } 81216ebf90aSShri Abhyankar val[jj++] = v2[j]; 81316ebf90aSShri Abhyankar } 814397b6df1SKris Buschelman } 815397b6df1SKris Buschelman irow++; 816397b6df1SKris Buschelman } 817397b6df1SKris Buschelman PetscFunctionReturn(0); 818397b6df1SKris Buschelman } 819397b6df1SKris Buschelman 820397b6df1SKris Buschelman #undef __FUNCT__ 82120be8e61SHong Zhang #define __FUNCT__ "MatGetDiagonal_MUMPS" 82220be8e61SHong Zhang PetscErrorCode MatGetDiagonal_MUMPS(Mat A,Vec v) 82320be8e61SHong Zhang { 82420be8e61SHong Zhang PetscFunctionBegin; 82520be8e61SHong Zhang SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Mat type: MUMPS factor"); 82620be8e61SHong Zhang PetscFunctionReturn(0); 82720be8e61SHong Zhang } 82820be8e61SHong Zhang 82920be8e61SHong Zhang #undef __FUNCT__ 8303924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 831dfbe8321SBarry Smith 
PetscErrorCode MatDestroy_MUMPS(Mat A) 832dfbe8321SBarry Smith { 833a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 834dfbe8321SBarry Smith PetscErrorCode ierr; 835b24902e0SBarry Smith 836397b6df1SKris Buschelman PetscFunctionBegin; 837a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 838a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 839a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 840801fbe65SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 841a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 842a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 843a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 844b34f08ffSHong Zhang ierr = PetscFree(mumps->info);CHKERRQ(ierr); 84559ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 846a5e57a09SHong Zhang mumps->id.job = JOB_END; 847a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 8486f3cc6f9SBarry Smith ierr = MPI_Comm_free(&mumps->comm_mumps);CHKERRQ(ierr); 849a5e57a09SHong Zhang if (mumps->Destroy) { 850a5e57a09SHong Zhang ierr = (mumps->Destroy)(A);CHKERRQ(ierr); 851bf0cc555SLisandro Dalcin } 852bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 853bf0cc555SLisandro Dalcin 85497969023SHong Zhang /* clear composed functions */ 855bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 856bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 857bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetIcntl_C",NULL);CHKERRQ(ierr); 858bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 859bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetCntl_C",NULL);CHKERRQ(ierr); 
860bc6112feSHong Zhang 861ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfo_C",NULL);CHKERRQ(ierr); 862ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfog_C",NULL);CHKERRQ(ierr); 863ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfo_C",NULL);CHKERRQ(ierr); 864ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfog_C",NULL);CHKERRQ(ierr); 8656444a565SStefano Zampini 8666444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetSchurIndices_C",NULL);CHKERRQ(ierr); 86759ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsInvertSchurComplement_C",NULL);CHKERRQ(ierr); 86859ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsCreateSchurComplement_C",NULL);CHKERRQ(ierr); 8696444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetSchurComplement_C",NULL);CHKERRQ(ierr); 87059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsRestoreSchurComplement_C",NULL);CHKERRQ(ierr); 871e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSolveSchurComplement_C",NULL);CHKERRQ(ierr); 8727404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSolveSchurComplementTranspose_C",NULL);CHKERRQ(ierr); 873397b6df1SKris Buschelman PetscFunctionReturn(0); 874397b6df1SKris Buschelman } 875397b6df1SKris Buschelman 876397b6df1SKris Buschelman #undef __FUNCT__ 877f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 878b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 879b24902e0SBarry Smith { 880a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 881d54de34fSKris Buschelman PetscScalar *array; 88267877ebaSShri Abhyankar Vec b_seq; 883329ec9b3SHong Zhang IS is_iden,is_petsc; 884dfbe8321SBarry Smith PetscErrorCode ierr; 885329ec9b3SHong 
Zhang PetscInt i; 886883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 887397b6df1SKris Buschelman 888397b6df1SKris Buschelman PetscFunctionBegin; 889883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 890883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 891a5e57a09SHong Zhang mumps->id.nrhs = 1; 892a5e57a09SHong Zhang b_seq = mumps->b_seq; 893a5e57a09SHong Zhang if (mumps->size > 1) { 894329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. 
Scatter b into a seqential rhs vector */ 895a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 896a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 897a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 898397b6df1SKris Buschelman } else { /* size == 1 */ 899397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 900397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 901397b6df1SKris Buschelman } 902a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 903a5e57a09SHong Zhang mumps->id.nrhs = 1; 904940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 905397b6df1SKris Buschelman } 906397b6df1SKris Buschelman 907b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 908b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 909b5fa320bSStefano Zampini 910397b6df1SKris Buschelman /* solve phase */ 911329ec9b3SHong Zhang /*-------------*/ 912a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 913a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 914a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 915397b6df1SKris Buschelman 916b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 917b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 918b5fa320bSStefano Zampini 919a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 920a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 921a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 922a5e57a09SHong Zhang ierr = 
VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 923397b6df1SKris Buschelman } 924a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 925a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 926a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 927a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 928a5e57a09SHong Zhang } 929a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 930a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 9316bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9326bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 9332205254eSKarl Rupp 934a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 935397b6df1SKris Buschelman } 936a5e57a09SHong Zhang 937a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 938a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 939329ec9b3SHong Zhang } 940397b6df1SKris Buschelman PetscFunctionReturn(0); 941397b6df1SKris Buschelman } 942397b6df1SKris Buschelman 94351d5961aSHong Zhang #undef __FUNCT__ 94451d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 94551d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 94651d5961aSHong Zhang { 947a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 94851d5961aSHong Zhang PetscErrorCode ierr; 94951d5961aSHong Zhang 95051d5961aSHong Zhang PetscFunctionBegin; 951a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 9520ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 953a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 95451d5961aSHong Zhang 
PetscFunctionReturn(0); 95551d5961aSHong Zhang } 95651d5961aSHong Zhang 957e0b74bf9SHong Zhang #undef __FUNCT__ 958e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 959e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 960e0b74bf9SHong Zhang { 961bda8bf91SBarry Smith PetscErrorCode ierr; 962bda8bf91SBarry Smith PetscBool flg; 9634e34a73bSHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 964334c5f61SHong Zhang PetscInt i,nrhs,M; 9652cd7d884SHong Zhang PetscScalar *array,*bray; 966bda8bf91SBarry Smith 967e0b74bf9SHong Zhang PetscFunctionBegin; 9680298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 969801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 9700298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 971801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 972801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 9734e34a73bSHong Zhang 9742cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 975334c5f61SHong Zhang mumps->id.nrhs = nrhs; 976334c5f61SHong Zhang mumps->id.lrhs = M; 9774e34a73bSHong Zhang 9782cd7d884SHong Zhang if (mumps->size == 1) { 9792cd7d884SHong Zhang /* copy B to X */ 9802cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 9812cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 9826444a565SStefano Zampini ierr = PetscMemcpy(array,bray,M*nrhs*sizeof(PetscScalar));CHKERRQ(ierr); 9832cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 984940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 985b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if 
any) */ 986b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 987801fbe65SHong Zhang 9882cd7d884SHong Zhang /* solve phase */ 9892cd7d884SHong Zhang /*-------------*/ 9902cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 9912cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 9922cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 993b5fa320bSStefano Zampini 994b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 995b5fa320bSStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps);CHKERRQ(ierr); 9962cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 997334c5f61SHong Zhang } else { /*--------- parallel case --------*/ 99871aed81dSHong Zhang PetscInt lsol_loc,nlsol_loc,*isol_loc,*idx,*iidx,*idxx,*isol_loc_save; 9991070efccSSatish Balay MumpsScalar *sol_loc,*sol_loc_save; 1000801fbe65SHong Zhang IS is_to,is_from; 1001334c5f61SHong Zhang PetscInt k,proc,j,m; 1002801fbe65SHong Zhang const PetscInt *rstart; 1003334c5f61SHong Zhang Vec v_mpi,b_seq,x_seq; 1004334c5f61SHong Zhang VecScatter scat_rhs,scat_sol; 1005801fbe65SHong Zhang 1006801fbe65SHong Zhang /* create x_seq to hold local solution */ 100771aed81dSHong Zhang isol_loc_save = mumps->id.isol_loc; /* save it for MatSovle() */ 100871aed81dSHong Zhang sol_loc_save = mumps->id.sol_loc; 1009801fbe65SHong Zhang 101071aed81dSHong Zhang lsol_loc = mumps->id.INFO(23); 101171aed81dSHong Zhang nlsol_loc = nrhs*lsol_loc; /* length of sol_loc */ 101271aed81dSHong Zhang ierr = PetscMalloc2(nlsol_loc,&sol_loc,nlsol_loc,&isol_loc);CHKERRQ(ierr); 1013940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1014801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 1015801fbe65SHong Zhang 10161070efccSSatish Balay ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,nlsol_loc,(PetscScalar*)sol_loc,&x_seq);CHKERRQ(ierr); 10172cd7d884SHong Zhang 
101874f0fcc7SHong Zhang /* copy rhs matrix B into vector v_mpi */ 1019334c5f61SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 1020801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 102174f0fcc7SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&v_mpi);CHKERRQ(ierr); 1022801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 1023801fbe65SHong Zhang 1024334c5f61SHong Zhang /* scatter v_mpi to b_seq because MUMPS only supports centralized rhs */ 102574f0fcc7SHong Zhang /* idx: maps from k-th index of v_mpi to (i,j)-th global entry of B; 1026801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 1027801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 1028801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 1029801fbe65SHong Zhang k = 0; 1030801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 1031801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 1032801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 1033801fbe65SHong Zhang iidx[j*M + i] = k; 1034801fbe65SHong Zhang idx[k++] = j*M + i; 1035801fbe65SHong Zhang } 1036801fbe65SHong Zhang } 10372cd7d884SHong Zhang } 10382cd7d884SHong Zhang 1039801fbe65SHong Zhang if (!mumps->myid) { 1040334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&b_seq);CHKERRQ(ierr); 1041801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1042801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 1043801fbe65SHong Zhang } else { 1044334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&b_seq);CHKERRQ(ierr); 1045801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 1046801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 1047801fbe65SHong Zhang } 1048334c5f61SHong 
Zhang ierr = VecScatterCreate(v_mpi,is_from,b_seq,is_to,&scat_rhs);CHKERRQ(ierr); 1049334c5f61SHong Zhang ierr = VecScatterBegin(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1050801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1051801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1052334c5f61SHong Zhang ierr = VecScatterEnd(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1053801fbe65SHong Zhang 1054801fbe65SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 1055334c5f61SHong Zhang ierr = VecGetArray(b_seq,&bray);CHKERRQ(ierr); 1056940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)bray; 1057334c5f61SHong Zhang ierr = VecRestoreArray(b_seq,&bray);CHKERRQ(ierr); 1058801fbe65SHong Zhang } 1059801fbe65SHong Zhang 1060801fbe65SHong Zhang /* solve phase */ 1061801fbe65SHong Zhang /*-------------*/ 1062801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 1063801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 1064801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 1065801fbe65SHong Zhang 1066334c5f61SHong Zhang /* scatter mumps distributed solution to petsc vector v_mpi, which shares local arrays with solution matrix X */ 106774f0fcc7SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 106874f0fcc7SHong Zhang ierr = VecPlaceArray(v_mpi,array);CHKERRQ(ierr); 1069801fbe65SHong Zhang 1070334c5f61SHong Zhang /* create scatter scat_sol */ 107171aed81dSHong Zhang ierr = PetscMalloc1(nlsol_loc,&idxx);CHKERRQ(ierr); 107271aed81dSHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nlsol_loc,0,1,&is_from);CHKERRQ(ierr); 107371aed81dSHong Zhang for (i=0; i<lsol_loc; i++) { 1074334c5f61SHong Zhang isol_loc[i] -= 1; /* change Fortran style to C style */ 1075334c5f61SHong Zhang idxx[i] = iidx[isol_loc[i]]; 1076801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 1077334c5f61SHong Zhang idxx[j*lsol_loc+i] = 
iidx[isol_loc[i]+j*M]; 1078801fbe65SHong Zhang } 1079801fbe65SHong Zhang } 108071aed81dSHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nlsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1081334c5f61SHong Zhang ierr = VecScatterCreate(x_seq,is_from,v_mpi,is_to,&scat_sol);CHKERRQ(ierr); 1082334c5f61SHong Zhang ierr = VecScatterBegin(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1083801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1084801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1085334c5f61SHong Zhang ierr = VecScatterEnd(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1086801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 108771aed81dSHong Zhang 108871aed81dSHong Zhang /* free spaces */ 108971aed81dSHong Zhang mumps->id.sol_loc = sol_loc_save; 109071aed81dSHong Zhang mumps->id.isol_loc = isol_loc_save; 109171aed81dSHong Zhang 109271aed81dSHong Zhang ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 1093801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 1094801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 109571aed81dSHong Zhang ierr = VecDestroy(&x_seq);CHKERRQ(ierr); 109674f0fcc7SHong Zhang ierr = VecDestroy(&v_mpi);CHKERRQ(ierr); 1097334c5f61SHong Zhang ierr = VecDestroy(&b_seq);CHKERRQ(ierr); 1098334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_rhs);CHKERRQ(ierr); 1099334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_sol);CHKERRQ(ierr); 1100801fbe65SHong Zhang } 1101e0b74bf9SHong Zhang PetscFunctionReturn(0); 1102e0b74bf9SHong Zhang } 1103e0b74bf9SHong Zhang 1104ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 1105a58c3f20SHong Zhang /* 1106a58c3f20SHong Zhang input: 1107a58c3f20SHong Zhang F: numeric factor 1108a58c3f20SHong Zhang output: 1109a58c3f20SHong Zhang nneg: total number of negative pivots 1110a58c3f20SHong Zhang nzero: 0 1111a58c3f20SHong Zhang npos: (global dimension of F) - nneg 1112a58c3f20SHong Zhang */ 1113a58c3f20SHong 
Zhang 1114a58c3f20SHong Zhang #undef __FUNCT__ 1115a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 1116dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 1117a58c3f20SHong Zhang { 1118a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1119dfbe8321SBarry Smith PetscErrorCode ierr; 1120c1490034SHong Zhang PetscMPIInt size; 1121a58c3f20SHong Zhang 1122a58c3f20SHong Zhang PetscFunctionBegin; 1123ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 1124bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 1125a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 1126ed85ac9fSHong Zhang 1127710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 1128ed85ac9fSHong Zhang if (nzero || npos) { 1129ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 1130710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 1131710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 1132a58c3f20SHong Zhang } 1133a58c3f20SHong Zhang PetscFunctionReturn(0); 1134a58c3f20SHong Zhang } 1135ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 1136a58c3f20SHong Zhang 1137397b6df1SKris Buschelman #undef __FUNCT__ 1138f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 11390481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 1140af281ebdSHong Zhang { 1141a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 11426849ba73SBarry Smith PetscErrorCode ierr; 
1143e09efc27SHong Zhang Mat F_diag; 1144ace3abfcSBarry Smith PetscBool isMPIAIJ; 1145397b6df1SKris Buschelman 1146397b6df1SKris Buschelman PetscFunctionBegin; 1147a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1148397b6df1SKris Buschelman 1149397b6df1SKris Buschelman /* numerical factorization phase */ 1150329ec9b3SHong Zhang /*-------------------------------*/ 1151a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 11524e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 1153a5e57a09SHong Zhang if (!mumps->myid) { 1154940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 1155397b6df1SKris Buschelman } 1156397b6df1SKris Buschelman } else { 1157940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 1158397b6df1SKris Buschelman } 1159a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1160a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 1161151787a6SHong Zhang if (mumps->id.INFO(1) == -13) { 1162*6c4ed002SBarry Smith if (mumps->id.INFO(2) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",-mumps->id.INFO(2)); 1163*6c4ed002SBarry Smith else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d bytes\n",mumps->id.INFO(2)); 1164151787a6SHong Zhang } 1165151787a6SHong Zhang } else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 1166397b6df1SKris Buschelman } 1167a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 1168397b6df1SKris Buschelman 1169dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 1170a5e57a09SHong Zhang mumps->matstruc = 
SAME_NONZERO_PATTERN; 1171b5fa320bSStefano Zampini mumps->schur_factored = PETSC_FALSE; 117259ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 117367877ebaSShri Abhyankar 1174066565c5SStefano Zampini /* just to be sure that ICNTL(19) value returned by a call from MatMumpsGetIcntl is always consistent */ 1175066565c5SStefano Zampini if (!mumps->sym && mumps->id.ICNTL(19) && mumps->id.ICNTL(19) != 1) mumps->id.ICNTL(19) = 3; 1176066565c5SStefano Zampini 1177a5e57a09SHong Zhang if (mumps->size > 1) { 117867877ebaSShri Abhyankar PetscInt lsol_loc; 117967877ebaSShri Abhyankar PetscScalar *sol_loc; 11802205254eSKarl Rupp 1181c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 1182c2093ab7SHong Zhang if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 1183c2093ab7SHong Zhang else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 1184c2093ab7SHong Zhang F_diag->assembled = PETSC_TRUE; 1185c2093ab7SHong Zhang 1186c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 1187c2093ab7SHong Zhang if (mumps->x_seq) { 1188c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 1189c2093ab7SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 1190c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 1191c2093ab7SHong Zhang } 1192a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 1193dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 1194a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 1195940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1196a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 119767877ebaSShri Abhyankar } 1198397b6df1SKris Buschelman PetscFunctionReturn(0); 1199397b6df1SKris Buschelman } 1200397b6df1SKris Buschelman 12019a2535b5SHong Zhang /* Sets MUMPS options from the 
options database */ 1202dcd589f8SShri Abhyankar #undef __FUNCT__ 12039a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 12049a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 1205dcd589f8SShri Abhyankar { 12069a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1207dcd589f8SShri Abhyankar PetscErrorCode ierr; 1208b34f08ffSHong Zhang PetscInt icntl,info[40],i,ninfo=40; 1209ace3abfcSBarry Smith PetscBool flg; 1210dcd589f8SShri Abhyankar 1211dcd589f8SShri Abhyankar PetscFunctionBegin; 1212ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 12139a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 12149a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 12159a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 12169a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 12179a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 12189a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 1219dcd589f8SShri Abhyankar 12209a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 12219a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 12229a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 12239a2535b5SHong Zhang 1224d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 
7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 12259a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 12269a2535b5SHong Zhang 1227d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 1228dcd589f8SShri Abhyankar if (flg) { 12292205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 12302205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 1231dcd589f8SShri Abhyankar } 1232e0b74bf9SHong Zhang 12330298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 1234d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 12350298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 1236d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 1237d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 1238d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 1239d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): 
percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 1240d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 124159ac8732SStefano Zampini if (mumps->id.ICNTL(19) <= 0 || mumps->id.ICNTL(19) > 3) { /* reset any schur data (if any) */ 124259ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 124359ac8732SStefano Zampini } 12444e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 1245d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 12469a2535b5SHong Zhang 1247d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 12480298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 12490298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 12509a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 12519a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 1252d7ebd59bSHong Zhang } 1253d7ebd59bSHong Zhang 1254d341cd04SHong Zhang ierr = 
PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 1255d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 12562cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 12570298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 1258d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 12590298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 1260d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 12614e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 12620298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1263dcd589f8SShri Abhyankar 12640298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): 
relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 12650298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 12660298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 12670298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 12680298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1269e5bb22a1SHong Zhang 12700298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1271b34f08ffSHong Zhang 127216d797efSHong Zhang ierr = PetscOptionsIntArray("-mat_mumps_view_info","request INFO local to each processor","",info,&ninfo,NULL);CHKERRQ(ierr); 1273b34f08ffSHong Zhang if (ninfo) { 1274b34f08ffSHong Zhang if (ninfo > 40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"number of INFO %d must <= 40\n",ninfo); 1275b34f08ffSHong Zhang ierr = PetscMalloc1(ninfo,&mumps->info);CHKERRQ(ierr); 1276b34f08ffSHong Zhang mumps->ninfo = ninfo; 1277b34f08ffSHong Zhang for (i=0; i<ninfo; i++) { 1278*6c4ed002SBarry Smith if (info[i] < 0 || info[i]>40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"index of INFO %d must between 1 and 40\n",ninfo); 1279*6c4ed002SBarry Smith else { 1280b34f08ffSHong Zhang mumps->info[i] = info[i]; 1281b34f08ffSHong Zhang } 1282b34f08ffSHong Zhang } 1283b34f08ffSHong Zhang } 1284b34f08ffSHong Zhang 1285dcd589f8SShri Abhyankar PetscOptionsEnd(); 1286dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1287dcd589f8SShri Abhyankar } 1288dcd589f8SShri Abhyankar 1289dcd589f8SShri Abhyankar 
#undef __FUNCT__ 1290dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1291f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1292dcd589f8SShri Abhyankar { 1293dcd589f8SShri Abhyankar PetscErrorCode ierr; 1294dcd589f8SShri Abhyankar 1295dcd589f8SShri Abhyankar PetscFunctionBegin; 1296ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1297ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1298ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 12992205254eSKarl Rupp 1300f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1301f697e70eSHong Zhang 1302f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1303f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1304f697e70eSHong Zhang mumps->id.sym = mumps->sym; 13052907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1306f697e70eSHong Zhang 13070298fd71SBarry Smith mumps->scat_rhs = NULL; 13080298fd71SBarry Smith mumps->scat_sol = NULL; 13099a2535b5SHong Zhang 131070544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 13119a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 13129a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 13139a2535b5SHong Zhang if (mumps->size == 1) { 13149a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 13159a2535b5SHong Zhang } else { 13169a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 13174e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 131870544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 13199a2535b5SHong Zhang } 13206444a565SStefano Zampini 13216444a565SStefano Zampini /* schur */ 13226444a565SStefano Zampini mumps->id.size_schur = 0; 13236444a565SStefano Zampini mumps->id.listvar_schur = NULL; 13246444a565SStefano Zampini 
mumps->id.schur = NULL; 1325b5fa320bSStefano Zampini mumps->schur_second_solve = PETSC_FALSE; 1326b5fa320bSStefano Zampini mumps->sizeredrhs = 0; 1327b5fa320bSStefano Zampini mumps->schur_pivots = NULL; 1328b5fa320bSStefano Zampini mumps->schur_work = NULL; 132959ac8732SStefano Zampini mumps->schur_sol = NULL; 133059ac8732SStefano Zampini mumps->schur_sizesol = 0; 133159ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 133259ac8732SStefano Zampini mumps->schur_factored = PETSC_FALSE; 133359ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 1334dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1335dcd589f8SShri Abhyankar } 1336dcd589f8SShri Abhyankar 1337a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1338397b6df1SKris Buschelman #undef __FUNCT__ 1339f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 13400481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1341b24902e0SBarry Smith { 1342a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1343dcd589f8SShri Abhyankar PetscErrorCode ierr; 134467877ebaSShri Abhyankar Vec b; 134567877ebaSShri Abhyankar IS is_iden; 134667877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1347397b6df1SKris Buschelman 1348397b6df1SKris Buschelman PetscFunctionBegin; 1349a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1350dcd589f8SShri Abhyankar 13519a2535b5SHong Zhang /* Set MUMPS options from the options database */ 13529a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1353dcd589f8SShri Abhyankar 1354a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1355dcd589f8SShri Abhyankar 135667877ebaSShri Abhyankar /* analysis phase */ 135767877ebaSShri Abhyankar /*----------------*/ 
1358a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1359a5e57a09SHong Zhang mumps->id.n = M; 1360a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 136167877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1362a5e57a09SHong Zhang if (!mumps->myid) { 1363a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1364a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1365940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 136667877ebaSShri Abhyankar } 1367a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 13685248a706SHong Zhang /* 13695248a706SHong Zhang PetscBool flag; 13705248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 13715248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 13725248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 13735248a706SHong Zhang */ 1374a5e57a09SHong Zhang if (!mumps->myid) { 1375e0b74bf9SHong Zhang const PetscInt *idx; 1376e0b74bf9SHong Zhang PetscInt i,*perm_in; 13772205254eSKarl Rupp 1378785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1379e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 13802205254eSKarl Rupp 1381a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1382e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! 
*/ 1383e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1384e0b74bf9SHong Zhang } 1385e0b74bf9SHong Zhang } 138667877ebaSShri Abhyankar } 138767877ebaSShri Abhyankar break; 138867877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1389a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1390a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1391a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1392940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 139367877ebaSShri Abhyankar } 139467877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1395a5e57a09SHong Zhang if (!mumps->myid) { 13962cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 13972cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 139867877ebaSShri Abhyankar } else { 1399a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 140067877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 140167877ebaSShri Abhyankar } 14022a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1403a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14046bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14056bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 140667877ebaSShri Abhyankar break; 140767877ebaSShri Abhyankar } 1408a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1409a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 141067877ebaSShri Abhyankar 1411719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1412dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 141351d5961aSHong Zhang 
F->ops->solvetranspose = MatSolveTranspose_MUMPS; 14144e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1415b24902e0SBarry Smith PetscFunctionReturn(0); 1416b24902e0SBarry Smith } 1417b24902e0SBarry Smith 1418450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1419450b117fSShri Abhyankar #undef __FUNCT__ 1420450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 1421450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1422450b117fSShri Abhyankar { 1423a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1424dcd589f8SShri Abhyankar PetscErrorCode ierr; 142567877ebaSShri Abhyankar Vec b; 142667877ebaSShri Abhyankar IS is_iden; 142767877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1428450b117fSShri Abhyankar 1429450b117fSShri Abhyankar PetscFunctionBegin; 1430a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1431dcd589f8SShri Abhyankar 14329a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14339a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1434dcd589f8SShri Abhyankar 1435a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 143667877ebaSShri Abhyankar 143767877ebaSShri Abhyankar /* analysis phase */ 143867877ebaSShri Abhyankar /*----------------*/ 1439a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1440a5e57a09SHong Zhang mumps->id.n = M; 1441a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 144267877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1443a5e57a09SHong Zhang if (!mumps->myid) { 1444a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1445a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1446940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 144767877ebaSShri Abhyankar } 144867877ebaSShri Abhyankar } 
144967877ebaSShri Abhyankar break; 145067877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1451a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1452a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1453a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1454940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 145567877ebaSShri Abhyankar } 145667877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1457a5e57a09SHong Zhang if (!mumps->myid) { 1458a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 145967877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 146067877ebaSShri Abhyankar } else { 1461a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 146267877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 146367877ebaSShri Abhyankar } 14642a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1465a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14666bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14676bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 146867877ebaSShri Abhyankar break; 146967877ebaSShri Abhyankar } 1470a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1471a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 147267877ebaSShri Abhyankar 1473450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1474dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 147551d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1476450b117fSShri Abhyankar PetscFunctionReturn(0); 1477450b117fSShri Abhyankar } 1478b24902e0SBarry Smith 
1479141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1480397b6df1SKris Buschelman #undef __FUNCT__ 148167877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 148267877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1483b24902e0SBarry Smith { 1484a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1485dcd589f8SShri Abhyankar PetscErrorCode ierr; 148667877ebaSShri Abhyankar Vec b; 148767877ebaSShri Abhyankar IS is_iden; 148867877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1489397b6df1SKris Buschelman 1490397b6df1SKris Buschelman PetscFunctionBegin; 1491a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1492dcd589f8SShri Abhyankar 14939a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14949a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1495dcd589f8SShri Abhyankar 1496a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1497dcd589f8SShri Abhyankar 149867877ebaSShri Abhyankar /* analysis phase */ 149967877ebaSShri Abhyankar /*----------------*/ 1500a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1501a5e57a09SHong Zhang mumps->id.n = M; 1502a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 150367877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1504a5e57a09SHong Zhang if (!mumps->myid) { 1505a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1506a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1507940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 150867877ebaSShri Abhyankar } 150967877ebaSShri Abhyankar } 151067877ebaSShri Abhyankar break; 151167877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1512a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1513a5e57a09SHong Zhang 
mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1514a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1515940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 151667877ebaSShri Abhyankar } 151767877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1518a5e57a09SHong Zhang if (!mumps->myid) { 1519a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 152067877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 152167877ebaSShri Abhyankar } else { 1522a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 152367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 152467877ebaSShri Abhyankar } 15252a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1526a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 15276bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 15286bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 152967877ebaSShri Abhyankar break; 153067877ebaSShri Abhyankar } 1531a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1532a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 153367877ebaSShri Abhyankar 15342792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1535dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 153651d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 15374e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 15384e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 15390298fd71SBarry Smith F->ops->getinertia = NULL; 15404e34a73bSHong Zhang #else 15414e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1542db4efbfdSBarry Smith #endif 1543b24902e0SBarry 
Smith PetscFunctionReturn(0); 1544b24902e0SBarry Smith } 1545b24902e0SBarry Smith 1546397b6df1SKris Buschelman #undef __FUNCT__ 154764e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 154864e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 154974ed9c26SBarry Smith { 1550f6c57405SHong Zhang PetscErrorCode ierr; 155164e6c443SBarry Smith PetscBool iascii; 155264e6c443SBarry Smith PetscViewerFormat format; 1553a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1554f6c57405SHong Zhang 1555f6c57405SHong Zhang PetscFunctionBegin; 155664e6c443SBarry Smith /* check if matrix is mumps type */ 155764e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 155864e6c443SBarry Smith 1559251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 156064e6c443SBarry Smith if (iascii) { 156164e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 156264e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 156364e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1564a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1565a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1566a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1567a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1568a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1569a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1570a5e57a09SHong Zhang ierr = 
PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1571a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1572a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1573a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1574a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1575a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1576a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1577a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1578a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1579a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1580a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1581a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1582a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1583f6c57405SHong Zhang } 1584a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1585a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): 
%d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1586a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1587f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1588a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1589a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1590a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1591ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (solution struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1592a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1593a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1594c0165424SHong Zhang 1595a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1596a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1597a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1598a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1599a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1600a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d 
\n",mumps->id.ICNTL(29));CHKERRQ(ierr); 160142179a6aSHong Zhang 1602a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1603a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1604a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1605f6c57405SHong Zhang 1606a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1607a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1608ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absolute pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1609ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (value of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1610a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1611f6c57405SHong Zhang 1612f6c57405SHong Zhang /* infomation local to each processor */ 161334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 16141575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(viewer);CHKERRQ(ierr); 1615a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 161634ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 161734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1618a5e57a09SHong Zhang ierr = 
PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 161934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 162034ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1621a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 162234ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1623f6c57405SHong Zhang 162434ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1625a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 162634ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1627f6c57405SHong Zhang 162834ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1629a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 163034ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1631f6c57405SHong Zhang 163234ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1633a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 163434ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1635b34f08ffSHong Zhang 1636b34f08ffSHong Zhang if (mumps->ninfo && mumps->ninfo <= 40){ 1637b34f08ffSHong Zhang PetscInt i; 1638b34f08ffSHong Zhang for (i=0; i<mumps->ninfo; i++){ 1639b34f08ffSHong Zhang ierr = PetscViewerASCIIPrintf(viewer, " INFO(%d): \n",mumps->info[i]);CHKERRQ(ierr); 1640b34f08ffSHong Zhang ierr = 
PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(mumps->info[i]));CHKERRQ(ierr); 1641b34f08ffSHong Zhang ierr = PetscViewerFlush(viewer); 1642b34f08ffSHong Zhang } 1643b34f08ffSHong Zhang } 1644b34f08ffSHong Zhang 1645b34f08ffSHong Zhang 16461575c14dSBarry Smith ierr = PetscViewerASCIIPopSynchronized(viewer);CHKERRQ(ierr); 1647f6c57405SHong Zhang 1648a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1649a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1650a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1651a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1652a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1653f6c57405SHong Zhang 1654a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1655a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1656a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1657a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1658a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," 
INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1659a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1660a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1661a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1662a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1663a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1664a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1665a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1666a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1667a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1668a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1669a5e57a09SHong Zhang ierr = 
PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1670a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1671a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1672a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1673a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1674a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1675a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1676a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 167740d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 167840d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 167940d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(30, 31) (after solution: 
size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 168040d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 168140d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 168240d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1683f6c57405SHong Zhang } 1684f6c57405SHong Zhang } 1685cb828f0fSHong Zhang } 1686f6c57405SHong Zhang PetscFunctionReturn(0); 1687f6c57405SHong Zhang } 1688f6c57405SHong Zhang 168935bd34faSBarry Smith #undef __FUNCT__ 169035bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 169135bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 169235bd34faSBarry Smith { 1693cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 169435bd34faSBarry Smith 169535bd34faSBarry Smith PetscFunctionBegin; 169635bd34faSBarry Smith info->block_size = 1.0; 1697cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1698cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 169935bd34faSBarry Smith info->nz_unneeded = 0.0; 170035bd34faSBarry Smith info->assemblies = 0.0; 170135bd34faSBarry Smith info->mallocs = 0.0; 170235bd34faSBarry Smith info->memory = 0.0; 170335bd34faSBarry Smith info->fill_ratio_given = 0; 170435bd34faSBarry Smith info->fill_ratio_needed = 0; 170535bd34faSBarry Smith info->factor_mallocs = 0; 170635bd34faSBarry Smith PetscFunctionReturn(0); 170735bd34faSBarry Smith } 170835bd34faSBarry Smith 17095ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 17105ccb76cbSHong Zhang #undef __FUNCT__ 17116444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices_MUMPS" 
17126444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices_MUMPS(Mat F,PetscInt size,PetscInt idxs[]) 17136444a565SStefano Zampini { 17146444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17156444a565SStefano Zampini PetscErrorCode ierr; 17166444a565SStefano Zampini 17176444a565SStefano Zampini PetscFunctionBegin; 171859ac8732SStefano Zampini if (mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MUMPS parallel Schur complements not yet supported from PETSc\n"); 17196444a565SStefano Zampini if (mumps->id.size_schur != size) { 17206444a565SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 17216444a565SStefano Zampini mumps->id.size_schur = size; 17226444a565SStefano Zampini mumps->id.schur_lld = size; 17236444a565SStefano Zampini ierr = PetscMalloc2(size,&mumps->id.listvar_schur,size*size,&mumps->id.schur);CHKERRQ(ierr); 17246444a565SStefano Zampini } 17256444a565SStefano Zampini ierr = PetscMemcpy(mumps->id.listvar_schur,idxs,size*sizeof(PetscInt));CHKERRQ(ierr); 17266444a565SStefano Zampini if (F->factortype == MAT_FACTOR_LU) { 172759ac8732SStefano Zampini mumps->id.ICNTL(19) = 3; /* MUMPS returns full matrix */ 17286444a565SStefano Zampini } else { 172959ac8732SStefano Zampini mumps->id.ICNTL(19) = 2; /* MUMPS returns lower triangular part */ 17306444a565SStefano Zampini } 173159ac8732SStefano Zampini /* set a special value of ICNTL (not handled my MUMPS) to be used in the solve phase by PETSc */ 1732b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 17336444a565SStefano Zampini PetscFunctionReturn(0); 17346444a565SStefano Zampini } 17356444a565SStefano Zampini 17366444a565SStefano Zampini #undef __FUNCT__ 17376444a565SStefano Zampini #define __FUNCT__ "MatMumpsSetSchurIndices" 17386444a565SStefano Zampini /*@ 17396444a565SStefano Zampini MatMumpsSetSchurIndices - Set indices defining the Schur complement that MUMPS will compute during the factorization steps 17406444a565SStefano Zampini 
17416444a565SStefano Zampini Logically Collective on Mat 17426444a565SStefano Zampini 17436444a565SStefano Zampini Input Parameters: 17446444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 17456444a565SStefano Zampini . size - size of the Schur complement indices 17466444a565SStefano Zampini - idxs[] - array of Schur complement indices 17476444a565SStefano Zampini 17486444a565SStefano Zampini Notes: 174959ac8732SStefano Zampini The user has to free the array idxs[] since the indices are copied by the routine. 175059ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 17516444a565SStefano Zampini 17526444a565SStefano Zampini Level: advanced 17536444a565SStefano Zampini 17546444a565SStefano Zampini References: MUMPS Users' Guide 17556444a565SStefano Zampini 175659ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsCreateSchurComplement(), MatMumpsGetSchurComplement() 17576444a565SStefano Zampini @*/ 17586444a565SStefano Zampini PetscErrorCode MatMumpsSetSchurIndices(Mat F,PetscInt size,PetscInt idxs[]) 17596444a565SStefano Zampini { 17606444a565SStefano Zampini PetscErrorCode ierr; 17616444a565SStefano Zampini 17626444a565SStefano Zampini PetscFunctionBegin; 1763e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 1764e807eca7SStefano Zampini if (size) PetscValidIntPointer(idxs,3); 17656444a565SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsSetSchurIndices_C",(Mat,PetscInt,PetscInt[]),(F,size,idxs));CHKERRQ(ierr); 17666444a565SStefano Zampini PetscFunctionReturn(0); 17676444a565SStefano Zampini } 176859ac8732SStefano Zampini 17696444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 17706444a565SStefano Zampini #undef __FUNCT__ 177159ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement_MUMPS" 177259ac8732SStefano Zampini PetscErrorCode 
MatMumpsCreateSchurComplement_MUMPS(Mat F,Mat* S) 17736444a565SStefano Zampini { 17746444a565SStefano Zampini Mat St; 17756444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17766444a565SStefano Zampini PetscScalar *array; 17776444a565SStefano Zampini #if defined(PETSC_USE_COMPLEX) 17788ac429a0SStefano Zampini PetscScalar im = PetscSqrtScalar((PetscScalar)-1.0); 17796444a565SStefano Zampini #endif 17806444a565SStefano Zampini PetscErrorCode ierr; 17816444a565SStefano Zampini 17826444a565SStefano Zampini PetscFunctionBegin; 17836f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 17846f3cc6f9SBarry Smith else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 17856f3cc6f9SBarry Smith else if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 17866f3cc6f9SBarry Smith 17876444a565SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)F),&St);CHKERRQ(ierr); 17886444a565SStefano Zampini ierr = MatSetSizes(St,PETSC_DECIDE,PETSC_DECIDE,mumps->id.size_schur,mumps->id.size_schur);CHKERRQ(ierr); 17896444a565SStefano Zampini ierr = MatSetType(St,MATDENSE);CHKERRQ(ierr); 17906444a565SStefano Zampini ierr = MatSetUp(St);CHKERRQ(ierr); 17916444a565SStefano Zampini ierr = MatDenseGetArray(St,&array);CHKERRQ(ierr); 179259ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full matrix */ 17936444a565SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 17946444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 17956444a565SStefano Zampini for (i=0;i<N;i++) { 17966444a565SStefano Zampini for (j=0;j<N;j++) { 17976444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 
17986444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 17996444a565SStefano Zampini #else 18006444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18016444a565SStefano Zampini #endif 18026444a565SStefano Zampini array[j*N+i] = val; 18036444a565SStefano Zampini } 18046444a565SStefano Zampini } 18056444a565SStefano Zampini } else { /* stored by columns */ 18066444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18076444a565SStefano Zampini } 18086444a565SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 18096444a565SStefano Zampini if (mumps->id.ICNTL(19) == 2) { /* lower triangular stored by columns */ 18106444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18116444a565SStefano Zampini for (i=0;i<N;i++) { 18126444a565SStefano Zampini for (j=i;j<N;j++) { 18136444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18146444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18156444a565SStefano Zampini #else 18166444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18176444a565SStefano Zampini #endif 18186444a565SStefano Zampini array[i*N+j] = val; 18196444a565SStefano Zampini array[j*N+i] = val; 18206444a565SStefano Zampini } 18216444a565SStefano Zampini } 18226444a565SStefano Zampini } else if (mumps->id.ICNTL(19) == 3) { /* full matrix */ 18236444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 18246444a565SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 18256444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 18266444a565SStefano Zampini for (i=0;i<N;i++) { 18276444a565SStefano Zampini for (j=0;j<i+1;j++) { 18286444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18296444a565SStefano Zampini 
PetscScalar val = mumps->id.schur[i*N+j]; 18306444a565SStefano Zampini #else 18316444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18326444a565SStefano Zampini #endif 18336444a565SStefano Zampini array[i*N+j] = val; 18346444a565SStefano Zampini array[j*N+i] = val; 18356444a565SStefano Zampini } 18366444a565SStefano Zampini } 18376444a565SStefano Zampini } 18386444a565SStefano Zampini } 18396444a565SStefano Zampini ierr = MatDenseRestoreArray(St,&array);CHKERRQ(ierr); 18406444a565SStefano Zampini *S = St; 18416444a565SStefano Zampini PetscFunctionReturn(0); 18426444a565SStefano Zampini } 18436444a565SStefano Zampini 18446444a565SStefano Zampini #undef __FUNCT__ 184559ac8732SStefano Zampini #define __FUNCT__ "MatMumpsCreateSchurComplement" 18466444a565SStefano Zampini /*@ 184759ac8732SStefano Zampini MatMumpsCreateSchurComplement - Create a Schur complement matrix object using Schur data computed by MUMPS during the factorization step 18486444a565SStefano Zampini 18496444a565SStefano Zampini Logically Collective on Mat 18506444a565SStefano Zampini 18516444a565SStefano Zampini Input Parameters: 18526444a565SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 18536444a565SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 18546444a565SStefano Zampini 18556444a565SStefano Zampini Notes: 185659ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 185759ac8732SStefano Zampini The routine provides a copy of the Schur data stored within MUMPS data strutures. The caller must destroy the object when it is no longer needed. 
1858066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 18596444a565SStefano Zampini 18606444a565SStefano Zampini Level: advanced 18616444a565SStefano Zampini 18626444a565SStefano Zampini References: MUMPS Users' Guide 18636444a565SStefano Zampini 186459ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement() 186559ac8732SStefano Zampini @*/ 186659ac8732SStefano Zampini PetscErrorCode MatMumpsCreateSchurComplement(Mat F,Mat* S) 186759ac8732SStefano Zampini { 186859ac8732SStefano Zampini PetscErrorCode ierr; 186959ac8732SStefano Zampini 187059ac8732SStefano Zampini PetscFunctionBegin; 1871e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 187259ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsCreateSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 187359ac8732SStefano Zampini PetscFunctionReturn(0); 187459ac8732SStefano Zampini } 187559ac8732SStefano Zampini 187659ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 187759ac8732SStefano Zampini #undef __FUNCT__ 187859ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement_MUMPS" 187959ac8732SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement_MUMPS(Mat F,Mat* S) 188059ac8732SStefano Zampini { 188159ac8732SStefano Zampini Mat St; 188259ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 188359ac8732SStefano Zampini PetscErrorCode ierr; 188459ac8732SStefano Zampini 188559ac8732SStefano Zampini PetscFunctionBegin; 18866f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 18876f3cc6f9SBarry Smith else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! 
You should call MatMumpsSetSchurIndices before"); 18886f3cc6f9SBarry Smith else if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 18896f3cc6f9SBarry Smith 189059ac8732SStefano Zampini /* It should be the responsibility of the user to handle different ICNTL(19) cases if they want to work with the raw data */ 189159ac8732SStefano Zampini /* should I also add errors when the Schur complement has been already factored? */ 189259ac8732SStefano Zampini ierr = MatCreateSeqDense(PetscObjectComm((PetscObject)F),mumps->id.size_schur,mumps->id.size_schur,(PetscScalar*)mumps->id.schur,&St);CHKERRQ(ierr); 189359ac8732SStefano Zampini *S = St; 189459ac8732SStefano Zampini mumps->schur_restored = PETSC_FALSE; 189559ac8732SStefano Zampini PetscFunctionReturn(0); 189659ac8732SStefano Zampini } 189759ac8732SStefano Zampini 189859ac8732SStefano Zampini #undef __FUNCT__ 189959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsGetSchurComplement" 190059ac8732SStefano Zampini /*@ 190159ac8732SStefano Zampini MatMumpsGetSchurComplement - Get a Schur complement matrix object using the current status of the raw Schur data computed by MUMPS during the factorization step 190259ac8732SStefano Zampini 190359ac8732SStefano Zampini Logically Collective on Mat 190459ac8732SStefano Zampini 190559ac8732SStefano Zampini Input Parameters: 190659ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 190759ac8732SStefano Zampini . *S - location where to return the Schur complement (MATDENSE) 190859ac8732SStefano Zampini 190959ac8732SStefano Zampini Notes: 191059ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 191159ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. 
The caller should call MatMumpsRestoreSchurComplement when the object is no longer needed. 1912066565c5SStefano Zampini If MatMumpsInvertSchurComplement has been called, the routine gets back the inverse 191359ac8732SStefano Zampini 191459ac8732SStefano Zampini Level: advanced 191559ac8732SStefano Zampini 191659ac8732SStefano Zampini References: MUMPS Users' Guide 191759ac8732SStefano Zampini 191859ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsRestoreSchurComplement(), MatMumpsCreateSchurComplement() 19196444a565SStefano Zampini @*/ 19206444a565SStefano Zampini PetscErrorCode MatMumpsGetSchurComplement(Mat F,Mat* S) 19216444a565SStefano Zampini { 19226444a565SStefano Zampini PetscErrorCode ierr; 19236444a565SStefano Zampini 19246444a565SStefano Zampini PetscFunctionBegin; 1925e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 192659ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsGetSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 192759ac8732SStefano Zampini PetscFunctionReturn(0); 192859ac8732SStefano Zampini } 192959ac8732SStefano Zampini 193059ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 193159ac8732SStefano Zampini #undef __FUNCT__ 193259ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement_MUMPS" 193359ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement_MUMPS(Mat F,Mat* S) 193459ac8732SStefano Zampini { 193559ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 193659ac8732SStefano Zampini PetscErrorCode ierr; 193759ac8732SStefano Zampini 193859ac8732SStefano Zampini PetscFunctionBegin; 19396f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! 
You should call MatMumpsSetSchurIndices to enable it"); 19406f3cc6f9SBarry Smith else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatMumpsSetSchurIndices before"); 19416f3cc6f9SBarry Smith else if (mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has been already restored"); 194259ac8732SStefano Zampini ierr = MatDestroy(S);CHKERRQ(ierr); 194359ac8732SStefano Zampini *S = NULL; 194459ac8732SStefano Zampini mumps->schur_restored = PETSC_TRUE; 194559ac8732SStefano Zampini PetscFunctionReturn(0); 194659ac8732SStefano Zampini } 194759ac8732SStefano Zampini 194859ac8732SStefano Zampini #undef __FUNCT__ 194959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsRestoreSchurComplement" 195059ac8732SStefano Zampini /*@ 195159ac8732SStefano Zampini MatMumpsRestoreSchurComplement - Restore the Schur complement matrix object obtained from a call to MatGetSchurComplement 195259ac8732SStefano Zampini 195359ac8732SStefano Zampini Logically Collective on Mat 195459ac8732SStefano Zampini 195559ac8732SStefano Zampini Input Parameters: 195659ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 195759ac8732SStefano Zampini . *S - location where the Schur complement is stored 195859ac8732SStefano Zampini 195959ac8732SStefano Zampini Notes: 196059ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 
196159ac8732SStefano Zampini 196259ac8732SStefano Zampini Level: advanced 196359ac8732SStefano Zampini 196459ac8732SStefano Zampini References: MUMPS Users' Guide 196559ac8732SStefano Zampini 196659ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices(), MatMumpsGetSchurComplement(), MatMumpsCreateSchurComplement() 196759ac8732SStefano Zampini @*/ 196859ac8732SStefano Zampini PetscErrorCode MatMumpsRestoreSchurComplement(Mat F,Mat* S) 196959ac8732SStefano Zampini { 197059ac8732SStefano Zampini PetscErrorCode ierr; 197159ac8732SStefano Zampini 197259ac8732SStefano Zampini PetscFunctionBegin; 1973e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 197459ac8732SStefano Zampini ierr = PetscUseMethod(F,"MatMumpsRestoreSchurComplement_C",(Mat,Mat*),(F,S));CHKERRQ(ierr); 197559ac8732SStefano Zampini PetscFunctionReturn(0); 197659ac8732SStefano Zampini } 197759ac8732SStefano Zampini 197859ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 197959ac8732SStefano Zampini #undef __FUNCT__ 198059ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement_MUMPS" 198159ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement_MUMPS(Mat F) 198259ac8732SStefano Zampini { 198359ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 198459ac8732SStefano Zampini PetscErrorCode ierr; 198559ac8732SStefano Zampini 198659ac8732SStefano Zampini PetscFunctionBegin; 198759ac8732SStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing */ 198859ac8732SStefano Zampini PetscFunctionReturn(0); 198959ac8732SStefano Zampini } 19906f3cc6f9SBarry Smith if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! 
You should call MatMumpsSetSchurIndices before"); 19916f3cc6f9SBarry Smith else if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 199259ac8732SStefano Zampini ierr = MatMumpsInvertSchur_Private(mumps);CHKERRQ(ierr); 199359ac8732SStefano Zampini PetscFunctionReturn(0); 199459ac8732SStefano Zampini } 199559ac8732SStefano Zampini 199659ac8732SStefano Zampini #undef __FUNCT__ 199759ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchurComplement" 199859ac8732SStefano Zampini /*@ 199959ac8732SStefano Zampini MatMumpsInvertSchurComplement - Invert the raw Schur data computed by MUMPS during the factorization step 200059ac8732SStefano Zampini 200159ac8732SStefano Zampini Logically Collective on Mat 200259ac8732SStefano Zampini 200359ac8732SStefano Zampini Input Parameters: 200459ac8732SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 200559ac8732SStefano Zampini 200659ac8732SStefano Zampini Notes: 200759ac8732SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 200859ac8732SStefano Zampini The routine uses the pointer to the raw data of the Schur Complement stored within MUMPS data strutures. 
200959ac8732SStefano Zampini 201059ac8732SStefano Zampini Level: advanced 201159ac8732SStefano Zampini 201259ac8732SStefano Zampini References: MUMPS Users' Guide 201359ac8732SStefano Zampini 201459ac8732SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 201559ac8732SStefano Zampini @*/ 201659ac8732SStefano Zampini PetscErrorCode MatMumpsInvertSchurComplement(Mat F) 201759ac8732SStefano Zampini { 201859ac8732SStefano Zampini PetscErrorCode ierr; 201959ac8732SStefano Zampini 202059ac8732SStefano Zampini PetscFunctionBegin; 2021e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 202259ac8732SStefano Zampini ierr = PetscTryMethod(F,"MatMumpsInvertSchurComplement_C",(Mat),(F));CHKERRQ(ierr); 20236444a565SStefano Zampini PetscFunctionReturn(0); 20246444a565SStefano Zampini } 20256444a565SStefano Zampini 20266444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 20276444a565SStefano Zampini #undef __FUNCT__ 2028e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement_MUMPS" 2029e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement_MUMPS(Mat F, Vec rhs, Vec sol) 2030e807eca7SStefano Zampini { 2031e807eca7SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2032e807eca7SStefano Zampini MumpsScalar *orhs; 2033e807eca7SStefano Zampini PetscScalar *osol,*nrhs,*nsol; 20349a3a5937SStefano Zampini PetscInt orhs_size,osol_size,olrhs_size; 2035e807eca7SStefano Zampini PetscErrorCode ierr; 2036e807eca7SStefano Zampini 2037e807eca7SStefano Zampini PetscFunctionBegin; 20386f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 20396f3cc6f9SBarry Smith if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! 
You should call MatMumpsSetSchurIndices before"); 20406f3cc6f9SBarry Smith else if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 20416f3cc6f9SBarry Smith 2042e807eca7SStefano Zampini /* swap pointers */ 2043e807eca7SStefano Zampini orhs = mumps->id.redrhs; 20449a3a5937SStefano Zampini olrhs_size = mumps->id.lredrhs; 2045a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 2046e807eca7SStefano Zampini osol = mumps->schur_sol; 2047a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 2048e807eca7SStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 2049e807eca7SStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 2050e807eca7SStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2051a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 20529a3a5937SStefano Zampini mumps->id.lredrhs = mumps->sizeredrhs; 2053e807eca7SStefano Zampini mumps->schur_sol = nsol; 2054a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 2055a12f35bfSStefano Zampini 2056e807eca7SStefano Zampini /* solve Schur complement */ 2057e807eca7SStefano Zampini mumps->id.nrhs = 1; 2058e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 2059e807eca7SStefano Zampini /* restore pointers */ 2060e807eca7SStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 2061e807eca7SStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 2062e807eca7SStefano Zampini mumps->id.redrhs = orhs; 20639a3a5937SStefano Zampini mumps->id.lredrhs = olrhs_size; 2064a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 2065e807eca7SStefano Zampini mumps->schur_sol = osol; 2066a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 2067e807eca7SStefano Zampini PetscFunctionReturn(0); 2068e807eca7SStefano Zampini } 2069e807eca7SStefano Zampini 2070e807eca7SStefano 
Zampini #undef __FUNCT__ 2071e807eca7SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplement" 2072e807eca7SStefano Zampini /*@ 2073e807eca7SStefano Zampini MatMumpsSolveSchurComplement - Solve the Schur complement system computed by MUMPS during the factorization step 2074e807eca7SStefano Zampini 2075e807eca7SStefano Zampini Logically Collective on Mat 2076e807eca7SStefano Zampini 2077e807eca7SStefano Zampini Input Parameters: 2078e807eca7SStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2079e807eca7SStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 2080e807eca7SStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 2081e807eca7SStefano Zampini 2082e807eca7SStefano Zampini Notes: 2083e807eca7SStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 2084e807eca7SStefano Zampini The sizes of the vectors should match the size of the Schur complement 2085e807eca7SStefano Zampini 2086e807eca7SStefano Zampini Level: advanced 2087e807eca7SStefano Zampini 2088e807eca7SStefano Zampini References: MUMPS Users' Guide 2089e807eca7SStefano Zampini 2090e807eca7SStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 2091e807eca7SStefano Zampini @*/ 2092e807eca7SStefano Zampini PetscErrorCode MatMumpsSolveSchurComplement(Mat F, Vec rhs, Vec sol) 2093e807eca7SStefano Zampini { 2094e807eca7SStefano Zampini PetscErrorCode ierr; 2095e807eca7SStefano Zampini 2096e807eca7SStefano Zampini PetscFunctionBegin; 2097e807eca7SStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 2098e807eca7SStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 2099e807eca7SStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 2100e807eca7SStefano Zampini PetscCheckSameComm(F,1,rhs,2); 2101e807eca7SStefano Zampini PetscCheckSameComm(F,1,sol,3); 21027404bcfbSStefano Zampini ierr = 
PetscUseMethod(F,"MatMumpsSolveSchurComplement_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 21037404bcfbSStefano Zampini PetscFunctionReturn(0); 21047404bcfbSStefano Zampini } 21057404bcfbSStefano Zampini 21067404bcfbSStefano Zampini /* -------------------------------------------------------------------------------------------*/ 21077404bcfbSStefano Zampini #undef __FUNCT__ 21087404bcfbSStefano Zampini #define __FUNCT__ "MatMumpsSolveSchurComplementTranspose_MUMPS" 21097404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose_MUMPS(Mat F, Vec rhs, Vec sol) 21107404bcfbSStefano Zampini { 21117404bcfbSStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 21127404bcfbSStefano Zampini MumpsScalar *orhs; 21137404bcfbSStefano Zampini PetscScalar *osol,*nrhs,*nsol; 2114a12f35bfSStefano Zampini PetscInt orhs_size,osol_size; 21157404bcfbSStefano Zampini PetscErrorCode ierr; 21167404bcfbSStefano Zampini 21177404bcfbSStefano Zampini PetscFunctionBegin; 21186f3cc6f9SBarry Smith if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatMumpsSetSchurIndices to enable it"); 21196f3cc6f9SBarry Smith else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! 
You should call MatMumpsSetSchurIndices before"); 21206f3cc6f9SBarry Smith if (!mumps->schur_restored) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur matrix has not been restored using MatMumpsRestoreSchurComplement"); 21216f3cc6f9SBarry Smith 21227404bcfbSStefano Zampini /* swap pointers */ 21237404bcfbSStefano Zampini orhs = mumps->id.redrhs; 2124a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 21257404bcfbSStefano Zampini osol = mumps->schur_sol; 2126a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 21277404bcfbSStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 21287404bcfbSStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 21297404bcfbSStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 2130a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 21317404bcfbSStefano Zampini mumps->schur_sol = nsol; 2132a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 2133a12f35bfSStefano Zampini 21347404bcfbSStefano Zampini /* solve Schur complement */ 21357404bcfbSStefano Zampini mumps->id.nrhs = 1; 21367404bcfbSStefano Zampini mumps->id.ICNTL(9) = 0; 21377404bcfbSStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 21387404bcfbSStefano Zampini mumps->id.ICNTL(9) = 1; 21397404bcfbSStefano Zampini /* restore pointers */ 21407404bcfbSStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 21417404bcfbSStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 21427404bcfbSStefano Zampini mumps->id.redrhs = orhs; 2143a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 21447404bcfbSStefano Zampini mumps->schur_sol = osol; 2145a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 21467404bcfbSStefano Zampini PetscFunctionReturn(0); 21477404bcfbSStefano Zampini } 21487404bcfbSStefano Zampini 21497404bcfbSStefano Zampini #undef __FUNCT__ 21507404bcfbSStefano Zampini #define __FUNCT__ 
"MatMumpsSolveSchurComplementTranspose" 21517404bcfbSStefano Zampini /*@ 21527404bcfbSStefano Zampini MatMumpsSolveSchurComplementTranspose - Solve the transpose of the Schur complement system computed by MUMPS during the factorization step 21537404bcfbSStefano Zampini 21547404bcfbSStefano Zampini Logically Collective on Mat 21557404bcfbSStefano Zampini 21567404bcfbSStefano Zampini Input Parameters: 21577404bcfbSStefano Zampini + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 21587404bcfbSStefano Zampini . rhs - location where the right hand side of the Schur complement system is stored 21597404bcfbSStefano Zampini - sol - location where the solution of the Schur complement system has to be returned 21607404bcfbSStefano Zampini 21617404bcfbSStefano Zampini Notes: 21627404bcfbSStefano Zampini MUMPS Schur complement mode is currently implemented for sequential matrices. 21637404bcfbSStefano Zampini The sizes of the vectors should match the size of the Schur complement 21647404bcfbSStefano Zampini 21657404bcfbSStefano Zampini Level: advanced 21667404bcfbSStefano Zampini 21677404bcfbSStefano Zampini References: MUMPS Users' Guide 21687404bcfbSStefano Zampini 21697404bcfbSStefano Zampini .seealso: MatGetFactor(), MatMumpsSetSchurIndices() 21707404bcfbSStefano Zampini @*/ 21717404bcfbSStefano Zampini PetscErrorCode MatMumpsSolveSchurComplementTranspose(Mat F, Vec rhs, Vec sol) 21727404bcfbSStefano Zampini { 21737404bcfbSStefano Zampini PetscErrorCode ierr; 21747404bcfbSStefano Zampini 21757404bcfbSStefano Zampini PetscFunctionBegin; 21767404bcfbSStefano Zampini PetscValidHeaderSpecific(F,MAT_CLASSID,1); 21777404bcfbSStefano Zampini PetscValidHeaderSpecific(rhs,VEC_CLASSID,2); 21787404bcfbSStefano Zampini PetscValidHeaderSpecific(sol,VEC_CLASSID,2); 21797404bcfbSStefano Zampini PetscCheckSameComm(F,1,rhs,2); 21807404bcfbSStefano Zampini PetscCheckSameComm(F,1,sol,3); 21817404bcfbSStefano Zampini ierr = 
PetscUseMethod(F,"MatMumpsSolveSchurComplementTranspose_C",(Mat,Vec,Vec),(F,rhs,sol));CHKERRQ(ierr); 2182e807eca7SStefano Zampini PetscFunctionReturn(0); 2183e807eca7SStefano Zampini } 2184e807eca7SStefano Zampini 2185e807eca7SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 2186e807eca7SStefano Zampini #undef __FUNCT__ 21875ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 21885ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 21895ccb76cbSHong Zhang { 2190a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 21915ccb76cbSHong Zhang 21925ccb76cbSHong Zhang PetscFunctionBegin; 2193a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 21945ccb76cbSHong Zhang PetscFunctionReturn(0); 21955ccb76cbSHong Zhang } 21965ccb76cbSHong Zhang 21975ccb76cbSHong Zhang #undef __FUNCT__ 2198bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 2199bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 2200bc6112feSHong Zhang { 2201bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2202bc6112feSHong Zhang 2203bc6112feSHong Zhang PetscFunctionBegin; 2204bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 2205bc6112feSHong Zhang PetscFunctionReturn(0); 2206bc6112feSHong Zhang } 2207bc6112feSHong Zhang 2208bc6112feSHong Zhang #undef __FUNCT__ 22095ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 22105ccb76cbSHong Zhang /*@ 22115ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 22125ccb76cbSHong Zhang 22135ccb76cbSHong Zhang Logically Collective on Mat 22145ccb76cbSHong Zhang 22155ccb76cbSHong Zhang Input Parameters: 22165ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 22175ccb76cbSHong Zhang . 
icntl - index of MUMPS parameter array ICNTL() 22185ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 22195ccb76cbSHong Zhang 22205ccb76cbSHong Zhang Options Database: 22215ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 22225ccb76cbSHong Zhang 22235ccb76cbSHong Zhang Level: beginner 22245ccb76cbSHong Zhang 22255ccb76cbSHong Zhang References: MUMPS Users' Guide 22265ccb76cbSHong Zhang 22275ccb76cbSHong Zhang .seealso: MatGetFactor() 22285ccb76cbSHong Zhang @*/ 22295ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 22305ccb76cbSHong Zhang { 22315ccb76cbSHong Zhang PetscErrorCode ierr; 22325ccb76cbSHong Zhang 22335ccb76cbSHong Zhang PetscFunctionBegin; 22345ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 22355ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 22365ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 22375ccb76cbSHong Zhang PetscFunctionReturn(0); 22385ccb76cbSHong Zhang } 22395ccb76cbSHong Zhang 2240bc6112feSHong Zhang #undef __FUNCT__ 2241bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 2242a21f80fcSHong Zhang /*@ 2243a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS parameter ICNTL() 2244a21f80fcSHong Zhang 2245a21f80fcSHong Zhang Logically Collective on Mat 2246a21f80fcSHong Zhang 2247a21f80fcSHong Zhang Input Parameters: 2248a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2249a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 2250a21f80fcSHong Zhang 2251a21f80fcSHong Zhang Output Parameter: 2252a21f80fcSHong Zhang . 
ival - value of MUMPS ICNTL(icntl) 2253a21f80fcSHong Zhang 2254a21f80fcSHong Zhang Level: beginner 2255a21f80fcSHong Zhang 2256a21f80fcSHong Zhang References: MUMPS Users' Guide 2257a21f80fcSHong Zhang 2258a21f80fcSHong Zhang .seealso: MatGetFactor() 2259a21f80fcSHong Zhang @*/ 2260bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 2261bc6112feSHong Zhang { 2262bc6112feSHong Zhang PetscErrorCode ierr; 2263bc6112feSHong Zhang 2264bc6112feSHong Zhang PetscFunctionBegin; 2265bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2266bc6112feSHong Zhang PetscValidIntPointer(ival,3); 2267bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2268bc6112feSHong Zhang PetscFunctionReturn(0); 2269bc6112feSHong Zhang } 2270bc6112feSHong Zhang 22718928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 22728928b65cSHong Zhang #undef __FUNCT__ 22738928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 22748928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 22758928b65cSHong Zhang { 22768928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 22778928b65cSHong Zhang 22788928b65cSHong Zhang PetscFunctionBegin; 22798928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 22808928b65cSHong Zhang PetscFunctionReturn(0); 22818928b65cSHong Zhang } 22828928b65cSHong Zhang 22838928b65cSHong Zhang #undef __FUNCT__ 2284bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl_MUMPS" 2285bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 2286bc6112feSHong Zhang { 2287bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2288bc6112feSHong Zhang 2289bc6112feSHong Zhang PetscFunctionBegin; 2290bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 2291bc6112feSHong Zhang PetscFunctionReturn(0); 2292bc6112feSHong Zhang } 2293bc6112feSHong 
Zhang 2294bc6112feSHong Zhang #undef __FUNCT__ 22958928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 22968928b65cSHong Zhang /*@ 22978928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 22988928b65cSHong Zhang 22998928b65cSHong Zhang Logically Collective on Mat 23008928b65cSHong Zhang 23018928b65cSHong Zhang Input Parameters: 23028928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 23038928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 23048928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 23058928b65cSHong Zhang 23068928b65cSHong Zhang Options Database: 23078928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 23088928b65cSHong Zhang 23098928b65cSHong Zhang Level: beginner 23108928b65cSHong Zhang 23118928b65cSHong Zhang References: MUMPS Users' Guide 23128928b65cSHong Zhang 23138928b65cSHong Zhang .seealso: MatGetFactor() 23148928b65cSHong Zhang @*/ 23158928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 23168928b65cSHong Zhang { 23178928b65cSHong Zhang PetscErrorCode ierr; 23188928b65cSHong Zhang 23198928b65cSHong Zhang PetscFunctionBegin; 23208928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2321bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 23228928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 23238928b65cSHong Zhang PetscFunctionReturn(0); 23248928b65cSHong Zhang } 23258928b65cSHong Zhang 2326bc6112feSHong Zhang #undef __FUNCT__ 2327bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 2328a21f80fcSHong Zhang /*@ 2329a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 2330a21f80fcSHong Zhang 2331a21f80fcSHong Zhang Logically Collective on Mat 2332a21f80fcSHong Zhang 2333a21f80fcSHong Zhang Input Parameters: 2334a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 
2335a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 2336a21f80fcSHong Zhang 2337a21f80fcSHong Zhang Output Parameter: 2338a21f80fcSHong Zhang . val - value of MUMPS CNTL(icntl) 2339a21f80fcSHong Zhang 2340a21f80fcSHong Zhang Level: beginner 2341a21f80fcSHong Zhang 2342a21f80fcSHong Zhang References: MUMPS Users' Guide 2343a21f80fcSHong Zhang 2344a21f80fcSHong Zhang .seealso: MatGetFactor() 2345a21f80fcSHong Zhang @*/ 2346bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 2347bc6112feSHong Zhang { 2348bc6112feSHong Zhang PetscErrorCode ierr; 2349bc6112feSHong Zhang 2350bc6112feSHong Zhang PetscFunctionBegin; 2351bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2352bc6112feSHong Zhang PetscValidRealPointer(val,3); 2353bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2354bc6112feSHong Zhang PetscFunctionReturn(0); 2355bc6112feSHong Zhang } 2356bc6112feSHong Zhang 2357bc6112feSHong Zhang #undef __FUNCT__ 2358ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 2359ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 2360bc6112feSHong Zhang { 2361bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2362bc6112feSHong Zhang 2363bc6112feSHong Zhang PetscFunctionBegin; 2364bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 2365bc6112feSHong Zhang PetscFunctionReturn(0); 2366bc6112feSHong Zhang } 2367bc6112feSHong Zhang 2368bc6112feSHong Zhang #undef __FUNCT__ 2369ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 2370ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 2371bc6112feSHong Zhang { 2372bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2373bc6112feSHong Zhang 2374bc6112feSHong Zhang PetscFunctionBegin; 2375bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 2376bc6112feSHong Zhang 
PetscFunctionReturn(0); 2377bc6112feSHong Zhang } 2378bc6112feSHong Zhang 2379bc6112feSHong Zhang #undef __FUNCT__ 2380ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo_MUMPS" 2381ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 2382bc6112feSHong Zhang { 2383bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2384bc6112feSHong Zhang 2385bc6112feSHong Zhang PetscFunctionBegin; 2386bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 2387bc6112feSHong Zhang PetscFunctionReturn(0); 2388bc6112feSHong Zhang } 2389bc6112feSHong Zhang 2390bc6112feSHong Zhang #undef __FUNCT__ 2391ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 2392ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 2393bc6112feSHong Zhang { 2394bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2395bc6112feSHong Zhang 2396bc6112feSHong Zhang PetscFunctionBegin; 2397bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 2398bc6112feSHong Zhang PetscFunctionReturn(0); 2399bc6112feSHong Zhang } 2400bc6112feSHong Zhang 2401bc6112feSHong Zhang #undef __FUNCT__ 2402ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 2403a21f80fcSHong Zhang /*@ 2404a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 2405a21f80fcSHong Zhang 2406a21f80fcSHong Zhang Logically Collective on Mat 2407a21f80fcSHong Zhang 2408a21f80fcSHong Zhang Input Parameters: 2409a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2410a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 2411a21f80fcSHong Zhang 2412a21f80fcSHong Zhang Output Parameter: 2413a21f80fcSHong Zhang . 
ival - value of MUMPS INFO(icntl) 2414a21f80fcSHong Zhang 2415a21f80fcSHong Zhang Level: beginner 2416a21f80fcSHong Zhang 2417a21f80fcSHong Zhang References: MUMPS Users' Guide 2418a21f80fcSHong Zhang 2419a21f80fcSHong Zhang .seealso: MatGetFactor() 2420a21f80fcSHong Zhang @*/ 2421ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 2422bc6112feSHong Zhang { 2423bc6112feSHong Zhang PetscErrorCode ierr; 2424bc6112feSHong Zhang 2425bc6112feSHong Zhang PetscFunctionBegin; 2426ca810319SHong Zhang PetscValidIntPointer(ival,3); 2427ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2428bc6112feSHong Zhang PetscFunctionReturn(0); 2429bc6112feSHong Zhang } 2430bc6112feSHong Zhang 2431bc6112feSHong Zhang #undef __FUNCT__ 2432ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 2433a21f80fcSHong Zhang /*@ 2434a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 2435a21f80fcSHong Zhang 2436a21f80fcSHong Zhang Logically Collective on Mat 2437a21f80fcSHong Zhang 2438a21f80fcSHong Zhang Input Parameters: 2439a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2440a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 2441a21f80fcSHong Zhang 2442a21f80fcSHong Zhang Output Parameter: 2443a21f80fcSHong Zhang . 
ival - value of MUMPS INFOG(icntl) 2444a21f80fcSHong Zhang 2445a21f80fcSHong Zhang Level: beginner 2446a21f80fcSHong Zhang 2447a21f80fcSHong Zhang References: MUMPS Users' Guide 2448a21f80fcSHong Zhang 2449a21f80fcSHong Zhang .seealso: MatGetFactor() 2450a21f80fcSHong Zhang @*/ 2451ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 2452bc6112feSHong Zhang { 2453bc6112feSHong Zhang PetscErrorCode ierr; 2454bc6112feSHong Zhang 2455bc6112feSHong Zhang PetscFunctionBegin; 2456ca810319SHong Zhang PetscValidIntPointer(ival,3); 2457ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2458bc6112feSHong Zhang PetscFunctionReturn(0); 2459bc6112feSHong Zhang } 2460bc6112feSHong Zhang 2461bc6112feSHong Zhang #undef __FUNCT__ 2462ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 2463a21f80fcSHong Zhang /*@ 2464a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 2465a21f80fcSHong Zhang 2466a21f80fcSHong Zhang Logically Collective on Mat 2467a21f80fcSHong Zhang 2468a21f80fcSHong Zhang Input Parameters: 2469a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2470a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 2471a21f80fcSHong Zhang 2472a21f80fcSHong Zhang Output Parameter: 2473a21f80fcSHong Zhang . 
val - value of MUMPS RINFO(icntl) 2474a21f80fcSHong Zhang 2475a21f80fcSHong Zhang Level: beginner 2476a21f80fcSHong Zhang 2477a21f80fcSHong Zhang References: MUMPS Users' Guide 2478a21f80fcSHong Zhang 2479a21f80fcSHong Zhang .seealso: MatGetFactor() 2480a21f80fcSHong Zhang @*/ 2481ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 2482bc6112feSHong Zhang { 2483bc6112feSHong Zhang PetscErrorCode ierr; 2484bc6112feSHong Zhang 2485bc6112feSHong Zhang PetscFunctionBegin; 2486bc6112feSHong Zhang PetscValidRealPointer(val,3); 2487ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2488bc6112feSHong Zhang PetscFunctionReturn(0); 2489bc6112feSHong Zhang } 2490bc6112feSHong Zhang 2491bc6112feSHong Zhang #undef __FUNCT__ 2492ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 2493a21f80fcSHong Zhang /*@ 2494a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 2495a21f80fcSHong Zhang 2496a21f80fcSHong Zhang Logically Collective on Mat 2497a21f80fcSHong Zhang 2498a21f80fcSHong Zhang Input Parameters: 2499a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2500a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 2501a21f80fcSHong Zhang 2502a21f80fcSHong Zhang Output Parameter: 2503a21f80fcSHong Zhang . 
val - value of MUMPS RINFOG(icntl) 2504a21f80fcSHong Zhang 2505a21f80fcSHong Zhang Level: beginner 2506a21f80fcSHong Zhang 2507a21f80fcSHong Zhang References: MUMPS Users' Guide 2508a21f80fcSHong Zhang 2509a21f80fcSHong Zhang .seealso: MatGetFactor() 2510a21f80fcSHong Zhang @*/ 2511ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 2512bc6112feSHong Zhang { 2513bc6112feSHong Zhang PetscErrorCode ierr; 2514bc6112feSHong Zhang 2515bc6112feSHong Zhang PetscFunctionBegin; 2516bc6112feSHong Zhang PetscValidRealPointer(val,3); 2517ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2518bc6112feSHong Zhang PetscFunctionReturn(0); 2519bc6112feSHong Zhang } 2520bc6112feSHong Zhang 252124b6179bSKris Buschelman /*MC 25222692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 252324b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 252424b6179bSKris Buschelman 252541c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 252624b6179bSKris Buschelman 2527c2b89b5dSBarry Smith Use ./configure --download-mumps --download-scalapack --download-parmetis --download-metis --download-ptscotch to have PETSc installed with MUMPS 2528c2b89b5dSBarry Smith 2529c2b89b5dSBarry Smith Use -pc_type cholesky or lu -pc_factor_mat_solver_package mumps to us this direct solver 2530c2b89b5dSBarry Smith 253124b6179bSKris Buschelman Options Database Keys: 25324e34a73bSHong Zhang + -mat_mumps_icntl_1 <6>: ICNTL(1): output stream for error messages (None) 25334e34a73bSHong Zhang . -mat_mumps_icntl_2 <0>: ICNTL(2): output stream for diagnostic printing, statistics, and warning (None) 25344e34a73bSHong Zhang . -mat_mumps_icntl_3 <0>: ICNTL(3): output stream for global information, collected on the host (None) 25354e34a73bSHong Zhang . 
-mat_mumps_icntl_4 <0>: ICNTL(4): level of printing (0 to 4) (None) 25364e34a73bSHong Zhang . -mat_mumps_icntl_6 <7>: ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) (None) 25374e34a73bSHong Zhang . -mat_mumps_icntl_7 <7>: ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis (None) 25384e34a73bSHong Zhang . -mat_mumps_icntl_8 <77>: ICNTL(8): scaling strategy (-2 to 8 or 77) (None) 25394e34a73bSHong Zhang . -mat_mumps_icntl_10 <0>: ICNTL(10): max num of refinements (None) 25404e34a73bSHong Zhang . -mat_mumps_icntl_11 <0>: ICNTL(11): statistics related to an error analysis (via -ksp_view) (None) 25414e34a73bSHong Zhang . -mat_mumps_icntl_12 <1>: ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) (None) 25424e34a73bSHong Zhang . -mat_mumps_icntl_13 <0>: ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting (None) 25434e34a73bSHong Zhang . -mat_mumps_icntl_14 <20>: ICNTL(14): percentage increase in the estimated working space (None) 25444e34a73bSHong Zhang . -mat_mumps_icntl_19 <0>: ICNTL(19): computes the Schur complement (None) 25454e34a73bSHong Zhang . -mat_mumps_icntl_22 <0>: ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) (None) 25464e34a73bSHong Zhang . -mat_mumps_icntl_23 <0>: ICNTL(23): max size of the working memory (MB) that can allocate per processor (None) 25474e34a73bSHong Zhang . -mat_mumps_icntl_24 <0>: ICNTL(24): detection of null pivot rows (0 or 1) (None) 25484e34a73bSHong Zhang . -mat_mumps_icntl_25 <0>: ICNTL(25): compute a solution of a deficient matrix and a null space basis (None) 25494e34a73bSHong Zhang . -mat_mumps_icntl_26 <0>: ICNTL(26): drives the solution phase if a Schur complement matrix (None) 25504e34a73bSHong Zhang . -mat_mumps_icntl_28 <1>: ICNTL(28): use 1 for sequential analysis and ICNTL(7) ordering, or 2 for parallel analysis and ICNTL(29) ordering (None) 25514e34a73bSHong Zhang .
-mat_mumps_icntl_29 <0>: ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis (None) 25524e34a73bSHong Zhang . -mat_mumps_icntl_30 <0>: ICNTL(30): compute user-specified set of entries in inv(A) (None) 25534e34a73bSHong Zhang . -mat_mumps_icntl_31 <0>: ICNTL(31): indicates which factors may be discarded during factorization (None) 25544e34a73bSHong Zhang . -mat_mumps_icntl_33 <0>: ICNTL(33): compute determinant (None) 25554e34a73bSHong Zhang . -mat_mumps_cntl_1 <0.01>: CNTL(1): relative pivoting threshold (None) 25564e34a73bSHong Zhang . -mat_mumps_cntl_2 <1.49012e-08>: CNTL(2): stopping criterion of refinement (None) 25574e34a73bSHong Zhang . -mat_mumps_cntl_3 <0>: CNTL(3): absolute pivoting threshold (None) 25584e34a73bSHong Zhang . -mat_mumps_cntl_4 <-1>: CNTL(4): value for static pivoting (None) 25594e34a73bSHong Zhang - -mat_mumps_cntl_5 <0>: CNTL(5): fixation for null pivots (None) 256024b6179bSKris Buschelman 256124b6179bSKris Buschelman Level: beginner 256224b6179bSKris Buschelman 256341c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 256441c8de11SBarry Smith 256524b6179bSKris Buschelman M*/ 256624b6179bSKris Buschelman 256735bd34faSBarry Smith #undef __FUNCT__ 256835bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 2569f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 257035bd34faSBarry Smith { 257135bd34faSBarry Smith PetscFunctionBegin; 25722692d6eeSBarry Smith *type = MATSOLVERMUMPS; 257335bd34faSBarry Smith PetscFunctionReturn(0); 257435bd34faSBarry Smith } 257535bd34faSBarry Smith 2576bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 25772877fffaSHong Zhang #undef __FUNCT__ 2578bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 25798cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 25802877fffaSHong Zhang { 25812877fffaSHong Zhang Mat B; 
25822877fffaSHong Zhang PetscErrorCode ierr; 25832877fffaSHong Zhang Mat_MUMPS *mumps; 2584ace3abfcSBarry Smith PetscBool isSeqAIJ; 25852877fffaSHong Zhang 25862877fffaSHong Zhang PetscFunctionBegin; 25872877fffaSHong Zhang /* Create the factorization matrix */ 2588251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 2589ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 25902877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 25912877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2592bccb9932SShri Abhyankar if (isSeqAIJ) { 25930298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 2594bccb9932SShri Abhyankar } else { 25950298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 2596bccb9932SShri Abhyankar } 25972877fffaSHong Zhang 2598b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 25992205254eSKarl Rupp 26002877fffaSHong Zhang B->ops->view = MatView_MUMPS; 260135bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 260220be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 26032205254eSKarl Rupp 2604bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2605bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2606bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2607bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2608bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2609bc6112feSHong Zhang 2610ca810319SHong Zhang ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2611ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2612ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2613ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 26146444a565SStefano Zampini 26156444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 261659ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 261759ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 26186444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 261959ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2620e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 26217404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2622e807eca7SStefano Zampini 2623450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2624450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 2625d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 2626bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = 
MatConvertToTriples_seqaij_seqaij; 2627bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 2628746480a1SHong Zhang mumps->sym = 0; 2629dcd589f8SShri Abhyankar } else { 263067877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2631450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 2632bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 2633bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 263459ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 263559ac8732SStefano Zampini mumps->sym = 2; 263659ac8732SStefano Zampini #else 26376fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 26386fdc2a6dSBarry Smith else mumps->sym = 2; 263959ac8732SStefano Zampini #endif 2640450b117fSShri Abhyankar } 26412877fffaSHong Zhang 26422877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 2643bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 26442877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 26452877fffaSHong Zhang B->spptr = (void*)mumps; 26462205254eSKarl Rupp 2647f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2648746480a1SHong Zhang 26492877fffaSHong Zhang *F = B; 26502877fffaSHong Zhang PetscFunctionReturn(0); 26512877fffaSHong Zhang } 26522877fffaSHong Zhang 2653bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 26542877fffaSHong Zhang #undef __FUNCT__ 2655bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 26568cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 26572877fffaSHong Zhang { 26582877fffaSHong Zhang Mat B; 26592877fffaSHong Zhang PetscErrorCode ierr; 26602877fffaSHong Zhang Mat_MUMPS *mumps; 2661ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 26622877fffaSHong Zhang 26632877fffaSHong Zhang PetscFunctionBegin; 2664ce94432eSBarry Smith if (ftype != 
MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 2665ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 2666251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 26672877fffaSHong Zhang /* Create the factorization matrix */ 2668ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 26692877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 26702877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2671b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2672bccb9932SShri Abhyankar if (isSeqSBAIJ) { 26730298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 26742205254eSKarl Rupp 267516ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 2676dcd589f8SShri Abhyankar } else { 26770298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 26782205254eSKarl Rupp 2679bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 2680bccb9932SShri Abhyankar } 2681bccb9932SShri Abhyankar 268267877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2683bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 268420be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 26852205254eSKarl Rupp 2686bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2687b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2688b13644aeSHong Zhang ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2689b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2690b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2691bc6112feSHong Zhang 2692ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2693ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2694ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2695ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 26962205254eSKarl Rupp 26976444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 269859ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 269959ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27006444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 270159ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2702e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 27037404bcfbSStefano Zampini ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 27046444a565SStefano Zampini 2705f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 270659ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 270759ac8732SStefano Zampini mumps->sym = 2; 270859ac8732SStefano Zampini #else 27096fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 27106fdc2a6dSBarry Smith else mumps->sym = 2; 271159ac8732SStefano Zampini #endif 2712a214ac2aSShri Abhyankar 2713bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 2714bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2715f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 27162877fffaSHong Zhang B->spptr = (void*)mumps; 27172205254eSKarl Rupp 2718f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2719746480a1SHong Zhang 27202877fffaSHong Zhang *F = B; 27212877fffaSHong Zhang PetscFunctionReturn(0); 27222877fffaSHong Zhang } 272397969023SHong Zhang 2724450b117fSShri Abhyankar #undef __FUNCT__ 2725bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 27268cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 272767877ebaSShri Abhyankar { 272867877ebaSShri Abhyankar Mat B; 272967877ebaSShri Abhyankar PetscErrorCode ierr; 273067877ebaSShri Abhyankar Mat_MUMPS *mumps; 2731ace3abfcSBarry Smith PetscBool isSeqBAIJ; 273267877ebaSShri Abhyankar 273367877ebaSShri Abhyankar PetscFunctionBegin; 273467877ebaSShri Abhyankar /* Create the factorization matrix */ 2735251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 2736ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 273767877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 273867877ebaSShri Abhyankar ierr = 
MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2739bccb9932SShri Abhyankar if (isSeqBAIJ) { 27400298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 2741bccb9932SShri Abhyankar } else { 27420298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 2743bccb9932SShri Abhyankar } 2744450b117fSShri Abhyankar 2745b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2746450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2747450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 2748450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 2749bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 2750bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 2751746480a1SHong Zhang mumps->sym = 0; 2752f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 2753bccb9932SShri Abhyankar 2754450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 275520be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 27562205254eSKarl Rupp 2757bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2758bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2759bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2760bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2761bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2762bc6112feSHong Zhang 2763ca810319SHong Zhang ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2764ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2765ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2766ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2767450b117fSShri Abhyankar 27686444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetSchurIndices_C",MatMumpsSetSchurIndices_MUMPS);CHKERRQ(ierr); 276959ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsInvertSchurComplement_C",MatMumpsInvertSchurComplement_MUMPS);CHKERRQ(ierr); 277059ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsCreateSchurComplement_C",MatMumpsCreateSchurComplement_MUMPS);CHKERRQ(ierr); 27716444a565SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetSchurComplement_C",MatMumpsGetSchurComplement_MUMPS);CHKERRQ(ierr); 277259ac8732SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsRestoreSchurComplement_C",MatMumpsRestoreSchurComplement_MUMPS);CHKERRQ(ierr); 2773e807eca7SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplement_C",MatMumpsSolveSchurComplement_MUMPS);CHKERRQ(ierr); 27747404bcfbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSolveSchurComplementTranspose_C",MatMumpsSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 27756444a565SStefano Zampini 2776450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2777bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2778450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2779450b117fSShri Abhyankar B->spptr = (void*)mumps; 27802205254eSKarl Rupp 2781f697e70eSHong Zhang ierr = 
PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2782746480a1SHong Zhang 2783450b117fSShri Abhyankar *F = B; 2784450b117fSShri Abhyankar PetscFunctionReturn(0); 2785450b117fSShri Abhyankar } 278642c9c57cSBarry Smith 278742c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 278842c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat,MatFactorType,Mat*); 278942c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat,MatFactorType,Mat*); 279042c9c57cSBarry Smith 279142c9c57cSBarry Smith #undef __FUNCT__ 279242c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 279329b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 279442c9c57cSBarry Smith { 279542c9c57cSBarry Smith PetscErrorCode ierr; 279642c9c57cSBarry Smith 279742c9c57cSBarry Smith PetscFunctionBegin; 279842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 279942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 280042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 280142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 280242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 280342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 280442c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 280542c9c57cSBarry Smith ierr = 
MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 280642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 280742c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 280842c9c57cSBarry Smith PetscFunctionReturn(0); 280942c9c57cSBarry Smith } 281042c9c57cSBarry Smith 2811