1dba47a55SKris Buschelman 29b54502bSHong Zhang /* 39b54502bSHong Zhang Defines a direct factorization preconditioner for any Mat implementation 49b54502bSHong Zhang Note: this need not be consided a preconditioner since it supplies 59b54502bSHong Zhang a direct solver. 69b54502bSHong Zhang */ 7ee45ca4aSHong Zhang 8c6db04a5SJed Brown #include <../src/ksp/pc/impls/factor/lu/lu.h> /*I "petscpc.h" I*/ 99b54502bSHong Zhang 10680c5173SHong Zhang 117087cfbeSBarry Smith PetscErrorCode PCFactorReorderForNonzeroDiagonal_LU(PC pc,PetscReal z) 129b54502bSHong Zhang { 139b54502bSHong Zhang PC_LU *lu = (PC_LU*)pc->data; 149b54502bSHong Zhang 159b54502bSHong Zhang PetscFunctionBegin; 169b54502bSHong Zhang lu->nonzerosalongdiagonal = PETSC_TRUE; 172fa5cd67SKarl Rupp if (z == PETSC_DECIDE) lu->nonzerosalongdiagonaltol = 1.e-10; 182fa5cd67SKarl Rupp else lu->nonzerosalongdiagonaltol = z; 199b54502bSHong Zhang PetscFunctionReturn(0); 209b54502bSHong Zhang } 219b54502bSHong Zhang 224416b707SBarry Smith static PetscErrorCode PCSetFromOptions_LU(PetscOptionItems *PetscOptionsObject,PC pc) 239b54502bSHong Zhang { 249b54502bSHong Zhang PC_LU *lu = (PC_LU*)pc->data; 259b54502bSHong Zhang PetscErrorCode ierr; 26ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 279b54502bSHong Zhang PetscReal tol; 289b54502bSHong Zhang 299b54502bSHong Zhang PetscFunctionBegin; 30e55864a3SBarry Smith ierr = PetscOptionsHead(PetscOptionsObject,"LU options");CHKERRQ(ierr); 31e55864a3SBarry Smith ierr = PCSetFromOptions_Factor(PetscOptionsObject,pc);CHKERRQ(ierr); 325c9eb25fSBarry Smith 332401956bSBarry Smith ierr = PetscOptionsName("-pc_factor_nonzeros_along_diagonal","Reorder to remove zeros from diagonal","PCFactorReorderForNonzeroDiagonal",&flg);CHKERRQ(ierr); 349b54502bSHong Zhang if (flg) { 359b54502bSHong Zhang tol = PETSC_DECIDE; 362401956bSBarry Smith ierr = PetscOptionsReal("-pc_factor_nonzeros_along_diagonal","Reorder to remove zeros from diagonal","PCFactorReorderForNonzeroDiagonal",lu->nonzerosalongdiagonaltol,&tol,0);CHKERRQ(ierr); 372401956bSBarry Smith ierr = PCFactorReorderForNonzeroDiagonal(pc,tol);CHKERRQ(ierr); 389b54502bSHong Zhang } 399b54502bSHong Zhang ierr = PetscOptionsTail();CHKERRQ(ierr); 409b54502bSHong Zhang PetscFunctionReturn(0); 419b54502bSHong Zhang } 429b54502bSHong Zhang 439b54502bSHong Zhang static PetscErrorCode PCView_LU(PC pc,PetscViewer viewer) 449b54502bSHong Zhang { 459b54502bSHong Zhang PetscErrorCode ierr; 469b54502bSHong Zhang 479b54502bSHong Zhang PetscFunctionBegin; 48914a5d51SHong Zhang ierr = PCView_Factor(pc,viewer);CHKERRQ(ierr); 499b54502bSHong Zhang PetscFunctionReturn(0); 509b54502bSHong Zhang } 519b54502bSHong Zhang 529b54502bSHong Zhang static PetscErrorCode PCSetUp_LU(PC pc) 539b54502bSHong Zhang { 549b54502bSHong Zhang PetscErrorCode ierr; 559b54502bSHong Zhang PC_LU *dir = (PC_LU*)pc->data; 56ea799195SBarry Smith MatSolverType stype; 5700e125f8SBarry Smith MatFactorError err; 583d1c1ea0SBarry Smith 599b54502bSHong Zhang PetscFunctionBegin; 60c6e4fdc6SHong Zhang pc->failedreason = PC_NOERROR; 613d1c1ea0SBarry Smith if (dir->hdr.reusefill && pc->setupcalled) ((PC_Factor*)dir)->info.fill = dir->hdr.actualfill; 629b54502bSHong Zhang 6384d44b13SHong Zhang ierr = MatSetErrorIfFailure(pc->pmat,pc->erroriffailure);CHKERRQ(ierr); 643d1c1ea0SBarry Smith if (dir->hdr.inplace) { 65fcfd50ebSBarry Smith if (dir->row && dir->col && dir->row != dir->col) {ierr = ISDestroy(&dir->row);CHKERRQ(ierr);} 66fcfd50ebSBarry Smith ierr = ISDestroy(&dir->col);CHKERRQ(ierr); 67075768bcSBarry Smith ierr = MatGetOrdering(pc->pmat,((PC_Factor*)dir)->ordering,&dir->row,&dir->col);CHKERRQ(ierr); 6803c60df9SBarry Smith if (dir->row) { 693bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)dir->row);CHKERRQ(ierr); 703bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)dir->col);CHKERRQ(ierr); 7103c60df9SBarry Smith } 72075768bcSBarry Smith ierr = MatLUFactor(pc->pmat,dir->row,dir->col,&((PC_Factor*)dir)->info);CHKERRQ(ierr); 7300e125f8SBarry Smith ierr = MatFactorGetError(pc->pmat,&err);CHKERRQ(ierr); 7400e125f8SBarry Smith if (err) { /* Factor() fails */ 7500e125f8SBarry Smith pc->failedreason = (PCFailedReason)err; 766baea169SHong Zhang PetscFunctionReturn(0); 776baea169SHong Zhang } 786baea169SHong Zhang 79075768bcSBarry Smith ((PC_Factor*)dir)->fact = pc->pmat; 809b54502bSHong Zhang } else { 819b54502bSHong Zhang MatInfo info; 8200e125f8SBarry Smith 839b54502bSHong Zhang if (!pc->setupcalled) { 84075768bcSBarry Smith ierr = MatGetOrdering(pc->pmat,((PC_Factor*)dir)->ordering,&dir->row,&dir->col);CHKERRQ(ierr); 859b54502bSHong Zhang if (dir->nonzerosalongdiagonal) { 869b54502bSHong Zhang ierr = MatReorderForNonzeroDiagonal(pc->pmat,dir->nonzerosalongdiagonaltol,dir->row,dir->col);CHKERRQ(ierr); 879b54502bSHong Zhang } 8803c60df9SBarry Smith if (dir->row) { 893bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)dir->row);CHKERRQ(ierr); 903bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)dir->col);CHKERRQ(ierr); 9103c60df9SBarry Smith } 92d09a07f4SBarry Smith if (!((PC_Factor*)dir)->fact) { 93075768bcSBarry Smith ierr = MatGetFactor(pc->pmat,((PC_Factor*)dir)->solvertype,MAT_FACTOR_LU,&((PC_Factor*)dir)->fact);CHKERRQ(ierr); 94a1f19f5aSHong Zhang } 95075768bcSBarry Smith ierr = MatLUFactorSymbolic(((PC_Factor*)dir)->fact,pc->pmat,dir->row,dir->col,&((PC_Factor*)dir)->info);CHKERRQ(ierr); 96075768bcSBarry Smith ierr = MatGetInfo(((PC_Factor*)dir)->fact,MAT_LOCAL,&info);CHKERRQ(ierr); 973d1c1ea0SBarry Smith dir->hdr.actualfill = info.fill_ratio_needed; 983bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)((PC_Factor*)dir)->fact);CHKERRQ(ierr); 999b54502bSHong Zhang } else if (pc->flag != SAME_NONZERO_PATTERN) { 1003d1c1ea0SBarry Smith if (!dir->hdr.reuseordering) { 101fcfd50ebSBarry Smith if (dir->row && dir->col && dir->row != dir->col) {ierr = ISDestroy(&dir->row);CHKERRQ(ierr);} 102fcfd50ebSBarry Smith ierr = ISDestroy(&dir->col);CHKERRQ(ierr); 103075768bcSBarry Smith ierr = MatGetOrdering(pc->pmat,((PC_Factor*)dir)->ordering,&dir->row,&dir->col);CHKERRQ(ierr); 1049b54502bSHong Zhang if (dir->nonzerosalongdiagonal) { 1059b54502bSHong Zhang ierr = MatReorderForNonzeroDiagonal(pc->pmat,dir->nonzerosalongdiagonaltol,dir->row,dir->col);CHKERRQ(ierr); 1069b54502bSHong Zhang } 10703c60df9SBarry Smith if (dir->row) { 1083bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)dir->row);CHKERRQ(ierr); 1093bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)dir->col);CHKERRQ(ierr); 11003c60df9SBarry Smith } 1119b54502bSHong Zhang } 1126bf464f9SBarry Smith ierr = MatDestroy(&((PC_Factor*)dir)->fact);CHKERRQ(ierr); 113075768bcSBarry Smith ierr = MatGetFactor(pc->pmat,((PC_Factor*)dir)->solvertype,MAT_FACTOR_LU,&((PC_Factor*)dir)->fact);CHKERRQ(ierr); 114075768bcSBarry Smith ierr = MatLUFactorSymbolic(((PC_Factor*)dir)->fact,pc->pmat,dir->row,dir->col,&((PC_Factor*)dir)->info);CHKERRQ(ierr); 115075768bcSBarry Smith ierr = MatGetInfo(((PC_Factor*)dir)->fact,MAT_LOCAL,&info);CHKERRQ(ierr); 1163d1c1ea0SBarry Smith dir->hdr.actualfill = info.fill_ratio_needed; 1173bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)((PC_Factor*)dir)->fact);CHKERRQ(ierr); 11804545d6dSBarry Smith } else { 119b8b68cfdSBarry Smith ierr = MatFactorGetError(((PC_Factor*)dir)->fact,&err);CHKERRQ(ierr); 120160a8794SBarry Smith if (err == MAT_FACTOR_NUMERIC_ZEROPIVOT) { 121b8b68cfdSBarry Smith ierr = MatFactorClearError(((PC_Factor*)dir)->fact);CHKERRQ(ierr); 122b8b68cfdSBarry Smith pc->failedreason = PC_NOERROR; 12304545d6dSBarry Smith } 1249b54502bSHong Zhang } 12500e125f8SBarry Smith ierr = MatFactorGetError(((PC_Factor*)dir)->fact,&err);CHKERRQ(ierr); 12600e125f8SBarry Smith if (err) { /* FactorSymbolic() fails */ 12700e125f8SBarry Smith pc->failedreason = (PCFailedReason)err; 1288c1cd74cSHong Zhang PetscFunctionReturn(0); 1298c1cd74cSHong Zhang } 1308c1cd74cSHong Zhang 131075768bcSBarry Smith ierr = MatLUFactorNumeric(((PC_Factor*)dir)->fact,pc->pmat,&((PC_Factor*)dir)->info);CHKERRQ(ierr); 13200e125f8SBarry Smith ierr = MatFactorGetError(((PC_Factor*)dir)->fact,&err);CHKERRQ(ierr); 13300e125f8SBarry Smith if (err) { /* FactorNumeric() fails */ 13400e125f8SBarry Smith pc->failedreason = (PCFailedReason)err; 1358c1cd74cSHong Zhang } 136680c5173SHong Zhang 1379b54502bSHong Zhang } 13800c67f3bSHong Zhang 1393ca39a21SBarry Smith ierr = PCFactorGetMatSolverType(pc,&stype);CHKERRQ(ierr); 14000c67f3bSHong Zhang if (!stype) { 141ea799195SBarry Smith MatSolverType solverpackage; 1423ca39a21SBarry Smith ierr = MatFactorGetSolverType(((PC_Factor*)dir)->fact,&solverpackage);CHKERRQ(ierr); 1433ca39a21SBarry Smith ierr = PCFactorSetMatSolverType(pc,solverpackage);CHKERRQ(ierr); 14400c67f3bSHong Zhang } 1459b54502bSHong Zhang PetscFunctionReturn(0); 1469b54502bSHong Zhang } 1479b54502bSHong Zhang 148574deadeSBarry Smith static PetscErrorCode PCReset_LU(PC pc) 1499b54502bSHong Zhang { 1509b54502bSHong Zhang PC_LU *dir = (PC_LU*)pc->data; 1519b54502bSHong Zhang PetscErrorCode ierr; 1529b54502bSHong Zhang 1539b54502bSHong Zhang PetscFunctionBegin; 1543d1c1ea0SBarry Smith if (!dir->hdr.inplace && ((PC_Factor*)dir)->fact) {ierr = MatDestroy(&((PC_Factor*)dir)->fact);CHKERRQ(ierr);} 155fcfd50ebSBarry Smith if (dir->row && dir->col && dir->row != dir->col) {ierr = ISDestroy(&dir->row);CHKERRQ(ierr);} 156fcfd50ebSBarry Smith ierr = ISDestroy(&dir->col);CHKERRQ(ierr); 157574deadeSBarry Smith PetscFunctionReturn(0); 158574deadeSBarry Smith } 159574deadeSBarry Smith 160574deadeSBarry Smith static PetscErrorCode PCDestroy_LU(PC pc) 161574deadeSBarry Smith { 162574deadeSBarry Smith PC_LU *dir = (PC_LU*)pc->data; 163574deadeSBarry Smith PetscErrorCode ierr; 164574deadeSBarry Smith 165574deadeSBarry Smith PetscFunctionBegin; 166574deadeSBarry Smith ierr = PCReset_LU(pc);CHKERRQ(ierr); 167503cfb0cSBarry Smith ierr = PetscFree(((PC_Factor*)dir)->ordering);CHKERRQ(ierr); 168503cfb0cSBarry Smith ierr = PetscFree(((PC_Factor*)dir)->solvertype);CHKERRQ(ierr); 169c31cb41cSBarry Smith ierr = PetscFree(pc->data);CHKERRQ(ierr); 1709b54502bSHong Zhang PetscFunctionReturn(0); 1719b54502bSHong Zhang } 1729b54502bSHong Zhang 1739b54502bSHong Zhang static PetscErrorCode PCApply_LU(PC pc,Vec x,Vec y) 1749b54502bSHong Zhang { 1759b54502bSHong Zhang PC_LU *dir = (PC_LU*)pc->data; 1769b54502bSHong Zhang PetscErrorCode ierr; 1779b54502bSHong Zhang 1789b54502bSHong Zhang PetscFunctionBegin; 1793d1c1ea0SBarry Smith if (dir->hdr.inplace) { 1802fa5cd67SKarl Rupp ierr = MatSolve(pc->pmat,x,y);CHKERRQ(ierr); 1812fa5cd67SKarl Rupp } else { 1822fa5cd67SKarl Rupp ierr = MatSolve(((PC_Factor*)dir)->fact,x,y);CHKERRQ(ierr); 1832fa5cd67SKarl Rupp } 1849b54502bSHong Zhang PetscFunctionReturn(0); 1859b54502bSHong Zhang } 1869b54502bSHong Zhang 1879b54502bSHong Zhang static PetscErrorCode PCApplyTranspose_LU(PC pc,Vec x,Vec y) 1889b54502bSHong Zhang { 1899b54502bSHong Zhang PC_LU *dir = (PC_LU*)pc->data; 1909b54502bSHong Zhang PetscErrorCode ierr; 1919b54502bSHong Zhang 1929b54502bSHong Zhang PetscFunctionBegin; 1933d1c1ea0SBarry Smith if (dir->hdr.inplace) { 1942fa5cd67SKarl Rupp ierr = MatSolveTranspose(pc->pmat,x,y);CHKERRQ(ierr); 1952fa5cd67SKarl Rupp } else { 1962fa5cd67SKarl Rupp ierr = MatSolveTranspose(((PC_Factor*)dir)->fact,x,y);CHKERRQ(ierr); 1972fa5cd67SKarl Rupp } 1989b54502bSHong Zhang PetscFunctionReturn(0); 1999b54502bSHong Zhang } 2009b54502bSHong Zhang 2019b54502bSHong Zhang /* -----------------------------------------------------------------------------------*/ 2029b54502bSHong Zhang 2039b54502bSHong Zhang /*MC 2049b54502bSHong Zhang PCLU - Uses a direct solver, based on LU factorization, as a preconditioner 2059b54502bSHong Zhang 2069b54502bSHong Zhang Options Database Keys: 2072401956bSBarry Smith + -pc_factor_reuse_ordering - Activate PCFactorSetReuseOrdering() 2083ca39a21SBarry Smith . -pc_factor_mat_solver_type - Actives PCFactorSetMatSolverType() to choose the direct solver, like superlu 2092401956bSBarry Smith . -pc_factor_reuse_fill - Activates PCFactorSetReuseFill() 21055ba2a51SBarry Smith . -pc_factor_fill <fill> - Sets fill amount 2112401956bSBarry Smith . -pc_factor_in_place - Activates in-place factorization 2122401956bSBarry Smith . -pc_factor_mat_ordering_type <nd,rcm,...> - Sets ordering routine 2132401956bSBarry Smith . -pc_factor_pivot_in_blocks <true,false> - allow pivoting within the small blocks during factorization (may increase 2149b54502bSHong Zhang stability of factorization. 215145b9266SHong Zhang . -pc_factor_shift_type <shifttype> - Sets shift type or PETSC_DECIDE for the default; use '-help' for a list of available types 216145b9266SHong Zhang . -pc_factor_shift_amount <shiftamount> - Sets shift amount or PETSC_DECIDE for the default 217e22d95b2SBarry Smith - -pc_factor_nonzeros_along_diagonal - permutes the rows and columns to try to put nonzero value along the 218e22d95b2SBarry Smith diagonal. 2199b54502bSHong Zhang 220*95452b02SPatrick Sanan Notes: 221*95452b02SPatrick Sanan Not all options work for all matrix formats 2229b54502bSHong Zhang Run with -help to see additional options for particular matrix formats or factorization 2239b54502bSHong Zhang algorithms 2249b54502bSHong Zhang 2259b54502bSHong Zhang Level: beginner 2269b54502bSHong Zhang 2279b54502bSHong Zhang Concepts: LU factorization, direct solver 2289b54502bSHong Zhang 229*95452b02SPatrick Sanan Notes: 230*95452b02SPatrick Sanan Usually this will compute an "exact" solution in one iteration and does 2319b54502bSHong Zhang not need a Krylov method (i.e. you can use -ksp_type preonly, or 2329b54502bSHong Zhang KSPSetType(ksp,KSPPREONLY) for the Krylov method 2339b54502bSHong Zhang 2349b54502bSHong Zhang .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, 235a4fd02acSBarry Smith PCILU, PCCHOLESKY, PCICC, PCFactorSetReuseOrdering(), PCFactorSetReuseFill(), PCFactorGetMatrix(), 2368ff23777SHong Zhang PCFactorSetFill(), PCFactorSetUseInPlace(), PCFactorSetMatOrderingType(), PCFactorSetColumnPivot(), 237145b9266SHong Zhang PCFactorSetPivotingInBlocks(),PCFactorSetShiftType(),PCFactorSetShiftAmount() 2388ff23777SHong Zhang PCFactorReorderForNonzeroDiagonal() 2399b54502bSHong Zhang M*/ 2409b54502bSHong Zhang 2418cc058d9SJed Brown PETSC_EXTERN PetscErrorCode PCCreate_LU(PC pc) 2429b54502bSHong Zhang { 2439b54502bSHong Zhang PetscErrorCode ierr; 2449b54502bSHong Zhang PetscMPIInt size; 2459b54502bSHong Zhang PC_LU *dir; 2469b54502bSHong Zhang 2479b54502bSHong Zhang PetscFunctionBegin; 248b00a9115SJed Brown ierr = PetscNewLog(pc,&dir);CHKERRQ(ierr); 2493d1c1ea0SBarry Smith pc->data = (void*)dir; 2503d1c1ea0SBarry Smith ierr = PCFactorInitialize(pc);CHKERRQ(ierr); 251d5f3da31SBarry Smith ((PC_Factor*)dir)->factortype = MAT_FACTOR_LU; 2529b54502bSHong Zhang dir->nonzerosalongdiagonal = PETSC_FALSE; 2539b54502bSHong Zhang 254075768bcSBarry Smith ((PC_Factor*)dir)->info.fill = 5.0; 255075768bcSBarry Smith ((PC_Factor*)dir)->info.dtcol = 1.e-6; /* default to pivoting; this is only thing PETSc LU supports */ 256f4db908eSBarry Smith ((PC_Factor*)dir)->info.shifttype = (PetscReal)MAT_SHIFT_NONE; 2579b54502bSHong Zhang dir->col = 0; 2589b54502bSHong Zhang dir->row = 0; 2595c9eb25fSBarry Smith 260ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)pc),&size);CHKERRQ(ierr); 2619b54502bSHong Zhang if (size == 1) { 26219fd82e9SBarry Smith ierr = PetscStrallocpy(MATORDERINGND,(char**)&((PC_Factor*)dir)->ordering);CHKERRQ(ierr); 2639b54502bSHong Zhang } else { 26419fd82e9SBarry Smith ierr = PetscStrallocpy(MATORDERINGNATURAL,(char**)&((PC_Factor*)dir)->ordering);CHKERRQ(ierr); 2659b54502bSHong Zhang } 2669b54502bSHong Zhang 267574deadeSBarry Smith pc->ops->reset = PCReset_LU; 2689b54502bSHong Zhang pc->ops->destroy = PCDestroy_LU; 2699b54502bSHong Zhang pc->ops->apply = PCApply_LU; 2709b54502bSHong Zhang pc->ops->applytranspose = PCApplyTranspose_LU; 2719b54502bSHong Zhang pc->ops->setup = PCSetUp_LU; 2729b54502bSHong Zhang pc->ops->setfromoptions = PCSetFromOptions_LU; 2739b54502bSHong Zhang pc->ops->view = PCView_LU; 2749b54502bSHong Zhang pc->ops->applyrichardson = 0; 275bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCFactorReorderForNonzeroDiagonal_C",PCFactorReorderForNonzeroDiagonal_LU);CHKERRQ(ierr); 2769b54502bSHong Zhang PetscFunctionReturn(0); 2779b54502bSHong Zhang } 278