107598726SKarl Rupp 207598726SKarl Rupp /* 307598726SKarl Rupp Include files needed for the ViennaCL Smoothed Aggregation preconditioner: 407598726SKarl Rupp pcimpl.h - private include file intended for use by all preconditioners 507598726SKarl Rupp */ 607598726SKarl Rupp #define PETSC_SKIP_SPINLOCK 799acd6aaSStefano Zampini #define PETSC_SKIP_IMMINTRIN_H_CUDAWORKAROUND 1 807598726SKarl Rupp #include <petsc/private/pcimpl.h> /*I "petscpc.h" I*/ 907598726SKarl Rupp #include <../src/mat/impls/aij/seq/aij.h> 1007598726SKarl Rupp #include <../src/vec/vec/impls/dvecimpl.h> 1107598726SKarl Rupp #include <../src/mat/impls/aij/seq/seqviennacl/viennaclmatimpl.h> 1207598726SKarl Rupp #include <../src/vec/vec/impls/seq/seqviennacl/viennaclvecimpl.h> 1307598726SKarl Rupp #include <viennacl/linalg/amg.hpp> 1407598726SKarl Rupp 1507598726SKarl Rupp /* 1607598726SKarl Rupp Private context (data structure) for the SAVIENNACL preconditioner. 1707598726SKarl Rupp */ 1807598726SKarl Rupp typedef struct { 1907598726SKarl Rupp viennacl::linalg::amg_precond<viennacl::compressed_matrix<PetscScalar>> *SAVIENNACL; 2007598726SKarl Rupp } PC_SAVIENNACL; 2107598726SKarl Rupp 2207598726SKarl Rupp /* 2307598726SKarl Rupp PCSetUp_SAVIENNACL - Prepares for the use of the SAVIENNACL preconditioner 2407598726SKarl Rupp by setting data structures and options. 2507598726SKarl Rupp 2607598726SKarl Rupp Input Parameter: 2707598726SKarl Rupp . pc - the preconditioner context 2807598726SKarl Rupp 2907598726SKarl Rupp Application Interface Routine: PCSetUp() 3007598726SKarl Rupp 31f1580f4eSBarry Smith Note: 3207598726SKarl Rupp The interface routine PCSetUp() is not usually called directly by 3307598726SKarl Rupp the user, but instead is called by PCApply() if necessary. 3407598726SKarl Rupp */ 35*d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCSetUp_SAVIENNACL(PC pc) 36*d71ae5a4SJacob Faibussowitsch { 3707598726SKarl Rupp PC_SAVIENNACL *sa = (PC_SAVIENNACL *)pc->data; 3807598726SKarl Rupp PetscBool flg = PETSC_FALSE; 3907598726SKarl Rupp Mat_SeqAIJViennaCL *gpustruct; 4007598726SKarl Rupp 4107598726SKarl Rupp PetscFunctionBegin; 429566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)pc->pmat, MATSEQAIJVIENNACL, &flg)); 4328b400f6SJacob Faibussowitsch PetscCheck(flg, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Currently only handles ViennaCL matrices"); 4407598726SKarl Rupp if (pc->setupcalled != 0) { 4507598726SKarl Rupp try { 4607598726SKarl Rupp delete sa->SAVIENNACL; 47*d71ae5a4SJacob Faibussowitsch } catch (char *ex) { 48*d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex); 49*d71ae5a4SJacob Faibussowitsch } 5007598726SKarl Rupp } 5107598726SKarl Rupp try { 5207598726SKarl Rupp #if defined(PETSC_USE_COMPLEX) 5307598726SKarl Rupp gpustruct = NULL; 5407598726SKarl Rupp SETERRQ(PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "No support for complex arithmetic in SAVIENNACL preconditioner"); 5507598726SKarl Rupp #else 569566063dSJacob Faibussowitsch PetscCall(MatViennaCLCopyToGPU(pc->pmat)); 5707598726SKarl Rupp gpustruct = (Mat_SeqAIJViennaCL *)(pc->pmat->spptr); 5807598726SKarl Rupp 5907598726SKarl Rupp viennacl::linalg::amg_tag amg_tag_sa_pmis; 6007598726SKarl Rupp amg_tag_sa_pmis.set_coarsening_method(viennacl::linalg::AMG_COARSENING_METHOD_MIS2_AGGREGATION); 6107598726SKarl Rupp amg_tag_sa_pmis.set_interpolation_method(viennacl::linalg::AMG_INTERPOLATION_METHOD_SMOOTHED_AGGREGATION); 6207598726SKarl Rupp ViennaCLAIJMatrix *mat = (ViennaCLAIJMatrix *)gpustruct->mat; 6307598726SKarl Rupp sa->SAVIENNACL = new viennacl::linalg::amg_precond<viennacl::compressed_matrix<PetscScalar>>(*mat, amg_tag_sa_pmis); 6407598726SKarl Rupp sa->SAVIENNACL->setup(); 6507598726SKarl Rupp #endif 66*d71ae5a4SJacob Faibussowitsch } catch (char *ex) { 67*d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex); 68*d71ae5a4SJacob Faibussowitsch } 6907598726SKarl Rupp PetscFunctionReturn(0); 7007598726SKarl Rupp } 7107598726SKarl Rupp 7207598726SKarl Rupp /* 7307598726SKarl Rupp PCApply_SAVIENNACL - Applies the SAVIENNACL preconditioner to a vector. 7407598726SKarl Rupp 7507598726SKarl Rupp Input Parameters: 7607598726SKarl Rupp . pc - the preconditioner context 7707598726SKarl Rupp . x - input vector 7807598726SKarl Rupp 7907598726SKarl Rupp Output Parameter: 8007598726SKarl Rupp . y - output vector 8107598726SKarl Rupp 8207598726SKarl Rupp Application Interface Routine: PCApply() 8307598726SKarl Rupp */ 84*d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCApply_SAVIENNACL(PC pc, Vec x, Vec y) 85*d71ae5a4SJacob Faibussowitsch { 8607598726SKarl Rupp PC_SAVIENNACL *sac = (PC_SAVIENNACL *)pc->data; 8707598726SKarl Rupp PetscBool flg1, flg2; 8807598726SKarl Rupp viennacl::vector<PetscScalar> const *xarray = NULL; 8907598726SKarl Rupp viennacl::vector<PetscScalar> *yarray = NULL; 9007598726SKarl Rupp 9107598726SKarl Rupp PetscFunctionBegin; 9207598726SKarl Rupp /*how to apply a certain fixed number of iterations?*/ 939566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)x, VECSEQVIENNACL, &flg1)); 949566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)y, VECSEQVIENNACL, &flg2)); 9508401ef6SPierre Jolivet PetscCheck((flg1 && flg2), PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Currently only handles ViennaCL vectors"); 9648a46eb9SPierre Jolivet if (!sac->SAVIENNACL) PetscCall(PCSetUp_SAVIENNACL(pc)); 979566063dSJacob Faibussowitsch PetscCall(VecViennaCLGetArrayRead(x, &xarray)); 989566063dSJacob Faibussowitsch PetscCall(VecViennaCLGetArrayWrite(y, &yarray)); 9907598726SKarl Rupp try { 100c4163675SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 10107598726SKarl Rupp *yarray = *xarray; 10207598726SKarl Rupp sac->SAVIENNACL->apply(*yarray); 10307598726SKarl Rupp #endif 104*d71ae5a4SJacob Faibussowitsch } catch (char *ex) { 105*d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex); 106*d71ae5a4SJacob Faibussowitsch } 1079566063dSJacob Faibussowitsch PetscCall(VecViennaCLRestoreArrayRead(x, &xarray)); 1089566063dSJacob Faibussowitsch PetscCall(VecViennaCLRestoreArrayWrite(y, &yarray)); 1099566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)y)); 11007598726SKarl Rupp PetscFunctionReturn(0); 11107598726SKarl Rupp } 112f1580f4eSBarry Smith 11307598726SKarl Rupp /* 11407598726SKarl Rupp PCDestroy_SAVIENNACL - Destroys the private context for the SAVIENNACL preconditioner 11507598726SKarl Rupp that was created with PCCreate_SAVIENNACL(). 11607598726SKarl Rupp 11707598726SKarl Rupp Input Parameter: 11807598726SKarl Rupp . pc - the preconditioner context 11907598726SKarl Rupp 12007598726SKarl Rupp Application Interface Routine: PCDestroy() 12107598726SKarl Rupp */ 122*d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCDestroy_SAVIENNACL(PC pc) 123*d71ae5a4SJacob Faibussowitsch { 12407598726SKarl Rupp PC_SAVIENNACL *sac = (PC_SAVIENNACL *)pc->data; 12507598726SKarl Rupp 12607598726SKarl Rupp PetscFunctionBegin; 12707598726SKarl Rupp if (sac->SAVIENNACL) { 12807598726SKarl Rupp try { 12907598726SKarl Rupp delete sac->SAVIENNACL; 130*d71ae5a4SJacob Faibussowitsch } catch (char *ex) { 131*d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex); 132*d71ae5a4SJacob Faibussowitsch } 13307598726SKarl Rupp } 13407598726SKarl Rupp 13507598726SKarl Rupp /* 13607598726SKarl Rupp Free the private data structure that was hanging off the PC 13707598726SKarl Rupp */ 1389566063dSJacob Faibussowitsch PetscCall(PetscFree(pc->data)); 13907598726SKarl Rupp PetscFunctionReturn(0); 14007598726SKarl Rupp } 14107598726SKarl Rupp 142*d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCSetFromOptions_SAVIENNACL(PC pc, PetscOptionItems *PetscOptionsObject) 143*d71ae5a4SJacob Faibussowitsch { 14407598726SKarl Rupp PetscFunctionBegin; 145d0609cedSBarry Smith PetscOptionsHeadBegin(PetscOptionsObject, "SAVIENNACL options"); 146d0609cedSBarry Smith PetscOptionsHeadEnd(); 14707598726SKarl Rupp PetscFunctionReturn(0); 14807598726SKarl Rupp } 14907598726SKarl Rupp 15007598726SKarl Rupp /*MC 15107598726SKarl Rupp PCSAViennaCL - A smoothed agglomeration algorithm that can be used via the CUDA, OpenCL, and OpenMP backends of ViennaCL 15207598726SKarl Rupp 15307598726SKarl Rupp Level: advanced 15407598726SKarl Rupp 155f1580f4eSBarry Smith Developer Note: 156f1580f4eSBarry Smith This `PCType` does not appear to be registered 15707598726SKarl Rupp 158f1580f4eSBarry Smith .seealso: `PCCreate()`, `PCSetType()`, `PCType`, `PC` 15907598726SKarl Rupp M*/ 16007598726SKarl Rupp 161*d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode PCCreate_SAVIENNACL(PC pc) 162*d71ae5a4SJacob Faibussowitsch { 16307598726SKarl Rupp PC_SAVIENNACL *sac; 16407598726SKarl Rupp 16507598726SKarl Rupp PetscFunctionBegin; 16607598726SKarl Rupp /* 16707598726SKarl Rupp Creates the private data structure for this preconditioner and 16807598726SKarl Rupp attach it to the PC object. 16907598726SKarl Rupp */ 1704dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&sac)); 17107598726SKarl Rupp pc->data = (void *)sac; 17207598726SKarl Rupp 17307598726SKarl Rupp /* 17407598726SKarl Rupp Initialize the pointer to zero 17507598726SKarl Rupp Initialize number of v-cycles to default (1) 17607598726SKarl Rupp */ 17707598726SKarl Rupp sac->SAVIENNACL = 0; 17807598726SKarl Rupp 17907598726SKarl Rupp /* 18007598726SKarl Rupp Set the pointers for the functions that are provided above. 18107598726SKarl Rupp Now when the user-level routines (such as PCApply(), PCDestroy(), etc.) 18207598726SKarl Rupp are called, they will automatically call these functions. Note we 18307598726SKarl Rupp choose not to provide a couple of these functions since they are 18407598726SKarl Rupp not needed. 18507598726SKarl Rupp */ 18607598726SKarl Rupp pc->ops->apply = PCApply_SAVIENNACL; 18707598726SKarl Rupp pc->ops->applytranspose = 0; 18807598726SKarl Rupp pc->ops->setup = PCSetUp_SAVIENNACL; 18907598726SKarl Rupp pc->ops->destroy = PCDestroy_SAVIENNACL; 19007598726SKarl Rupp pc->ops->setfromoptions = PCSetFromOptions_SAVIENNACL; 19107598726SKarl Rupp pc->ops->view = 0; 19207598726SKarl Rupp pc->ops->applyrichardson = 0; 19307598726SKarl Rupp pc->ops->applysymmetricleft = 0; 19407598726SKarl Rupp pc->ops->applysymmetricright = 0; 19507598726SKarl Rupp PetscFunctionReturn(0); 19607598726SKarl Rupp } 197