14b3f184cSKarl Rupp 24b3f184cSKarl Rupp /* -------------------------------------------------------------------- */ 34b3f184cSKarl Rupp 44b3f184cSKarl Rupp /* 54b3f184cSKarl Rupp Include files needed for the ViennaCL Chow-Patel parallel ILU preconditioner: 64b3f184cSKarl Rupp pcimpl.h - private include file intended for use by all preconditioners 74b3f184cSKarl Rupp */ 84b3f184cSKarl Rupp #define PETSC_SKIP_SPINLOCK 999acd6aaSStefano Zampini #define PETSC_SKIP_IMMINTRIN_H_CUDAWORKAROUND 1 1099acd6aaSStefano Zampini 114b3f184cSKarl Rupp #include <petsc/private/pcimpl.h> /*I "petscpc.h" I*/ 124b3f184cSKarl Rupp #include <../src/mat/impls/aij/seq/aij.h> 134b3f184cSKarl Rupp #include <../src/vec/vec/impls/dvecimpl.h> 144b3f184cSKarl Rupp #include <../src/mat/impls/aij/seq/seqviennacl/viennaclmatimpl.h> 154b3f184cSKarl Rupp #include <../src/vec/vec/impls/seq/seqviennacl/viennaclvecimpl.h> 164b3f184cSKarl Rupp #include <viennacl/linalg/detail/ilu/chow_patel_ilu.hpp> 174b3f184cSKarl Rupp 184b3f184cSKarl Rupp /* 194b3f184cSKarl Rupp Private context (data structure) for the CHOWILUVIENNACL preconditioner. 204b3f184cSKarl Rupp */ 214b3f184cSKarl Rupp typedef struct { 224b3f184cSKarl Rupp viennacl::linalg::chow_patel_ilu_precond< viennacl::compressed_matrix<PetscScalar> > *CHOWILUVIENNACL; 234b3f184cSKarl Rupp } PC_CHOWILUVIENNACL; 244b3f184cSKarl Rupp 254b3f184cSKarl Rupp /* -------------------------------------------------------------------------- */ 264b3f184cSKarl Rupp /* 274b3f184cSKarl Rupp PCSetUp_CHOWILUVIENNACL - Prepares for the use of the CHOWILUVIENNACL preconditioner 284b3f184cSKarl Rupp by setting data structures and options. 294b3f184cSKarl Rupp 304b3f184cSKarl Rupp Input Parameter: 314b3f184cSKarl Rupp . 
pc - the preconditioner context 324b3f184cSKarl Rupp 334b3f184cSKarl Rupp Application Interface Routine: PCSetUp() 344b3f184cSKarl Rupp 354b3f184cSKarl Rupp Notes: 364b3f184cSKarl Rupp The interface routine PCSetUp() is not usually called directly by 374b3f184cSKarl Rupp the user, but instead is called by PCApply() if necessary. 384b3f184cSKarl Rupp */ 394b3f184cSKarl Rupp static PetscErrorCode PCSetUp_CHOWILUVIENNACL(PC pc) 404b3f184cSKarl Rupp { 414b3f184cSKarl Rupp PC_CHOWILUVIENNACL *ilu = (PC_CHOWILUVIENNACL*)pc->data; 424b3f184cSKarl Rupp PetscBool flg = PETSC_FALSE; 434b3f184cSKarl Rupp Mat_SeqAIJViennaCL *gpustruct; 444b3f184cSKarl Rupp 454b3f184cSKarl Rupp PetscFunctionBegin; 469566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)pc->pmat,MATSEQAIJVIENNACL,&flg)); 4728b400f6SJacob Faibussowitsch PetscCheck(flg,PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Currently only handles ViennaCL matrices"); 484b3f184cSKarl Rupp if (pc->setupcalled != 0) { 494b3f184cSKarl Rupp try { 504b3f184cSKarl Rupp delete ilu->CHOWILUVIENNACL; 514b3f184cSKarl Rupp } catch(char *ex) { 5298921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"ViennaCL error: %s", ex); 534b3f184cSKarl Rupp } 544b3f184cSKarl Rupp } 554b3f184cSKarl Rupp try { 564b3f184cSKarl Rupp #if defined(PETSC_USE_COMPLEX) 574b3f184cSKarl Rupp gpustruct = NULL; 584b3f184cSKarl Rupp SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"No support for complex arithmetic in CHOWILUVIENNACL preconditioner"); 594b3f184cSKarl Rupp #else 609566063dSJacob Faibussowitsch PetscCall(MatViennaCLCopyToGPU(pc->pmat)); 614b3f184cSKarl Rupp gpustruct = (Mat_SeqAIJViennaCL*)(pc->pmat->spptr); 624b3f184cSKarl Rupp 634b3f184cSKarl Rupp viennacl::linalg::chow_patel_tag ilu_tag; 644b3f184cSKarl Rupp ViennaCLAIJMatrix *mat = (ViennaCLAIJMatrix*)gpustruct->mat; 654b3f184cSKarl Rupp ilu->CHOWILUVIENNACL = new viennacl::linalg::chow_patel_ilu_precond<viennacl::compressed_matrix<PetscScalar> 
>(*mat, ilu_tag); 664b3f184cSKarl Rupp #endif 674b3f184cSKarl Rupp } catch(char *ex) { 6898921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"ViennaCL error: %s", ex); 694b3f184cSKarl Rupp } 704b3f184cSKarl Rupp PetscFunctionReturn(0); 714b3f184cSKarl Rupp } 724b3f184cSKarl Rupp 734b3f184cSKarl Rupp /* -------------------------------------------------------------------------- */ 744b3f184cSKarl Rupp /* 754b3f184cSKarl Rupp PCApply_CHOWILUVIENNACL - Applies the CHOWILUVIENNACL preconditioner to a vector. 764b3f184cSKarl Rupp 774b3f184cSKarl Rupp Input Parameters: 784b3f184cSKarl Rupp . pc - the preconditioner context 794b3f184cSKarl Rupp . x - input vector 804b3f184cSKarl Rupp 814b3f184cSKarl Rupp Output Parameter: 824b3f184cSKarl Rupp . y - output vector 834b3f184cSKarl Rupp 844b3f184cSKarl Rupp Application Interface Routine: PCApply() 854b3f184cSKarl Rupp */ 864b3f184cSKarl Rupp static PetscErrorCode PCApply_CHOWILUVIENNACL(PC pc,Vec x,Vec y) 874b3f184cSKarl Rupp { 884b3f184cSKarl Rupp PC_CHOWILUVIENNACL *ilu = (PC_CHOWILUVIENNACL*)pc->data; 894b3f184cSKarl Rupp PetscBool flg1,flg2; 904b3f184cSKarl Rupp viennacl::vector<PetscScalar> const *xarray=NULL; 914b3f184cSKarl Rupp viennacl::vector<PetscScalar> *yarray=NULL; 924b3f184cSKarl Rupp 934b3f184cSKarl Rupp PetscFunctionBegin; 944b3f184cSKarl Rupp /*how to apply a certain fixed number of iterations?*/ 959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)x,VECSEQVIENNACL,&flg1)); 969566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)y,VECSEQVIENNACL,&flg2)); 9708401ef6SPierre Jolivet PetscCheck((flg1 && flg2),PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP, "Currently only handles ViennaCL vectors"); 984b3f184cSKarl Rupp if (!ilu->CHOWILUVIENNACL) { 999566063dSJacob Faibussowitsch PetscCall(PCSetUp_CHOWILUVIENNACL(pc)); 1004b3f184cSKarl Rupp } 1019566063dSJacob Faibussowitsch PetscCall(VecSet(y,0.0)); 1029566063dSJacob Faibussowitsch 
PetscCall(VecViennaCLGetArrayRead(x,&xarray)); 1039566063dSJacob Faibussowitsch PetscCall(VecViennaCLGetArrayWrite(y,&yarray)); 1044b3f184cSKarl Rupp try { 1054b3f184cSKarl Rupp #if defined(PETSC_USE_COMPLEX) 1064b3f184cSKarl Rupp 1074b3f184cSKarl Rupp #else 1084b3f184cSKarl Rupp *yarray = *xarray; 1094b3f184cSKarl Rupp ilu->CHOWILUVIENNACL->apply(*yarray); 1104b3f184cSKarl Rupp #endif 1114b3f184cSKarl Rupp } catch(char * ex) { 11298921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"ViennaCL error: %s", ex); 1134b3f184cSKarl Rupp } 1149566063dSJacob Faibussowitsch PetscCall(VecViennaCLRestoreArrayRead(x,&xarray)); 1159566063dSJacob Faibussowitsch PetscCall(VecViennaCLRestoreArrayWrite(y,&yarray)); 1169566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)y)); 1174b3f184cSKarl Rupp PetscFunctionReturn(0); 1184b3f184cSKarl Rupp } 1194b3f184cSKarl Rupp /* -------------------------------------------------------------------------- */ 1204b3f184cSKarl Rupp /* 1214b3f184cSKarl Rupp PCDestroy_CHOWILUVIENNACL - Destroys the private context for the CHOWILUVIENNACL preconditioner 1224b3f184cSKarl Rupp that was created with PCCreate_CHOWILUVIENNACL(). 1234b3f184cSKarl Rupp 1244b3f184cSKarl Rupp Input Parameter: 1254b3f184cSKarl Rupp . 
pc - the preconditioner context 1264b3f184cSKarl Rupp 1274b3f184cSKarl Rupp Application Interface Routine: PCDestroy() 1284b3f184cSKarl Rupp */ 1294b3f184cSKarl Rupp static PetscErrorCode PCDestroy_CHOWILUVIENNACL(PC pc) 1304b3f184cSKarl Rupp { 1314b3f184cSKarl Rupp PC_CHOWILUVIENNACL *ilu = (PC_CHOWILUVIENNACL*)pc->data; 1324b3f184cSKarl Rupp 1334b3f184cSKarl Rupp PetscFunctionBegin; 1344b3f184cSKarl Rupp if (ilu->CHOWILUVIENNACL) { 1354b3f184cSKarl Rupp try { 1364b3f184cSKarl Rupp delete ilu->CHOWILUVIENNACL; 1374b3f184cSKarl Rupp } catch(char *ex) { 13898921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"ViennaCL error: %s", ex); 1394b3f184cSKarl Rupp } 1404b3f184cSKarl Rupp } 1414b3f184cSKarl Rupp 1424b3f184cSKarl Rupp /* 1434b3f184cSKarl Rupp Free the private data structure that was hanging off the PC 1444b3f184cSKarl Rupp */ 1459566063dSJacob Faibussowitsch PetscCall(PetscFree(pc->data)); 1464b3f184cSKarl Rupp PetscFunctionReturn(0); 1474b3f184cSKarl Rupp } 1484b3f184cSKarl Rupp 1494b3f184cSKarl Rupp static PetscErrorCode PCSetFromOptions_CHOWILUVIENNACL(PetscOptionItems *PetscOptionsObject,PC pc) 1504b3f184cSKarl Rupp { 1514b3f184cSKarl Rupp PetscFunctionBegin; 152d0609cedSBarry Smith PetscOptionsHeadBegin(PetscOptionsObject,"CHOWILUVIENNACL options"); 153d0609cedSBarry Smith PetscOptionsHeadEnd(); 1544b3f184cSKarl Rupp PetscFunctionReturn(0); 1554b3f184cSKarl Rupp } 1564b3f184cSKarl Rupp 1574b3f184cSKarl Rupp /* -------------------------------------------------------------------------- */ 1584b3f184cSKarl Rupp 1594b3f184cSKarl Rupp /*MC 1604b3f184cSKarl Rupp PCCHOWILUViennaCL - A smoothed agglomeration algorithm that can be used via the CUDA, OpenCL, and OpenMP backends of ViennaCL 1614b3f184cSKarl Rupp 1624b3f184cSKarl Rupp Level: advanced 1634b3f184cSKarl Rupp 164*db781477SPatrick Sanan .seealso: `PCCreate()`, `PCSetType()`, `PCType`, `PC` 1654b3f184cSKarl Rupp 1664b3f184cSKarl Rupp M*/ 1674b3f184cSKarl Rupp 1684b3f184cSKarl Rupp 
/*
   PCCreate_CHOWILUVIENNACL - Creates the private context for the CHOWILUVIENNACL
   preconditioner and installs its operations on the PC.

   Input Parameter:
.  pc - the preconditioner context
*/
PETSC_EXTERN PetscErrorCode PCCreate_CHOWILUVIENNACL(PC pc)
{
  PC_CHOWILUVIENNACL *ctx;

  PetscFunctionBegin;
  /*
     Allocate the private data structure, mark the ViennaCL preconditioner as
     not yet built, and attach the structure to the PC object.
  */
  PetscCall(PetscNewLog(pc,&ctx));
  ctx->CHOWILUVIENNACL = NULL;
  pc->data             = (void*)ctx;

  /*
     Operations implemented in this file. The user-level routines
     (PCApply(), PCSetUp(), PCDestroy(), ...) dispatch through these pointers.
  */
  pc->ops->setup          = PCSetUp_CHOWILUVIENNACL;
  pc->ops->apply          = PCApply_CHOWILUVIENNACL;
  pc->ops->destroy        = PCDestroy_CHOWILUVIENNACL;
  pc->ops->setfromoptions = PCSetFromOptions_CHOWILUVIENNACL;

  /*
     Operations this preconditioner does not provide.
  */
  pc->ops->applytranspose      = NULL;
  pc->ops->view                = NULL;
  pc->ops->applyrichardson     = NULL;
  pc->ops->applysymmetricleft  = NULL;
  pc->ops->applysymmetricright = NULL;
  PetscFunctionReturn(0);
}