xref: /petsc/src/ksp/pc/impls/rowscalingviennacl/rowscalingviennacl.cxx (revision 48a46eb9bd028bec07ec0f396b1a3abb43f14558)
170baa948SKarl Rupp 
270baa948SKarl Rupp /*  -------------------------------------------------------------------- */
370baa948SKarl Rupp 
470baa948SKarl Rupp /*
570baa948SKarl Rupp    Include files needed for the ViennaCL row-scaling preconditioner:
670baa948SKarl Rupp      pcimpl.h - private include file intended for use by all preconditioners
770baa948SKarl Rupp */
#define PETSC_SKIP_SPINLOCK
#define PETSC_SKIP_IMMINTRIN_H_CUDAWORKAROUND 1

#include <petsc/private/pcimpl.h> /*I "petscpc.h" I*/
#include <../src/mat/impls/aij/seq/aij.h>
#include <../src/vec/vec/impls/dvecimpl.h>
#include <../src/mat/impls/aij/seq/seqviennacl/viennaclmatimpl.h>
#include <../src/vec/vec/impls/seq/seqviennacl/viennaclvecimpl.h>
#include <viennacl/linalg/row_scaling.hpp>
#include <exception>
1770baa948SKarl Rupp 
1870baa948SKarl Rupp /*
1970baa948SKarl Rupp    Private context (data structure) for the ROWSCALINGVIENNACL preconditioner.
2070baa948SKarl Rupp */
2170baa948SKarl Rupp typedef struct {
2270baa948SKarl Rupp   viennacl::linalg::row_scaling<viennacl::compressed_matrix<PetscScalar>> *ROWSCALINGVIENNACL;
2370baa948SKarl Rupp } PC_ROWSCALINGVIENNACL;
2470baa948SKarl Rupp 
2570baa948SKarl Rupp /* -------------------------------------------------------------------------- */
2670baa948SKarl Rupp /*
2770baa948SKarl Rupp    PCSetUp_ROWSCALINGVIENNACL - Prepares for the use of the ROWSCALINGVIENNACL preconditioner
2870baa948SKarl Rupp                                 by setting data structures and options.
2970baa948SKarl Rupp 
3070baa948SKarl Rupp    Input Parameter:
3170baa948SKarl Rupp .  pc - the preconditioner context
3270baa948SKarl Rupp 
3370baa948SKarl Rupp    Application Interface Routine: PCSetUp()
3470baa948SKarl Rupp 
3570baa948SKarl Rupp    Notes:
3670baa948SKarl Rupp    The interface routine PCSetUp() is not usually called directly by
3770baa948SKarl Rupp    the user, but instead is called by PCApply() if necessary.
3870baa948SKarl Rupp */
399371c9d4SSatish Balay static PetscErrorCode PCSetUp_ROWSCALINGVIENNACL(PC pc) {
4070baa948SKarl Rupp   PC_ROWSCALINGVIENNACL *rowscaling = (PC_ROWSCALINGVIENNACL *)pc->data;
4170baa948SKarl Rupp   PetscBool              flg        = PETSC_FALSE;
4270baa948SKarl Rupp   Mat_SeqAIJViennaCL    *gpustruct;
4370baa948SKarl Rupp 
4470baa948SKarl Rupp   PetscFunctionBegin;
459566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)pc->pmat, MATSEQAIJVIENNACL, &flg));
4628b400f6SJacob Faibussowitsch   PetscCheck(flg, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Currently only handles ViennaCL matrices");
4770baa948SKarl Rupp   if (pc->setupcalled != 0) {
4870baa948SKarl Rupp     try {
4970baa948SKarl Rupp       delete rowscaling->ROWSCALINGVIENNACL;
509371c9d4SSatish Balay     } catch (char *ex) { SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex); }
5170baa948SKarl Rupp   }
5270baa948SKarl Rupp   try {
5370baa948SKarl Rupp #if defined(PETSC_USE_COMPLEX)
5470baa948SKarl Rupp     gpustruct = NULL;
5570baa948SKarl Rupp     SETERRQ(PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "No support for complex arithmetic in ROWSCALINGVIENNACL preconditioner");
5670baa948SKarl Rupp #else
579566063dSJacob Faibussowitsch     PetscCall(MatViennaCLCopyToGPU(pc->pmat));
5870baa948SKarl Rupp     gpustruct = (Mat_SeqAIJViennaCL *)(pc->pmat->spptr);
5970baa948SKarl Rupp 
6070baa948SKarl Rupp     viennacl::linalg::row_scaling_tag pc_tag(1);
6170baa948SKarl Rupp     ViennaCLAIJMatrix                *mat = (ViennaCLAIJMatrix *)gpustruct->mat;
6270baa948SKarl Rupp     rowscaling->ROWSCALINGVIENNACL        = new viennacl::linalg::row_scaling<viennacl::compressed_matrix<PetscScalar>>(*mat, pc_tag);
6370baa948SKarl Rupp #endif
649371c9d4SSatish Balay   } catch (char *ex) { SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex); }
6570baa948SKarl Rupp   PetscFunctionReturn(0);
6670baa948SKarl Rupp }
6770baa948SKarl Rupp 
6870baa948SKarl Rupp /* -------------------------------------------------------------------------- */
6970baa948SKarl Rupp /*
7070baa948SKarl Rupp    PCApply_ROWSCALINGVIENNACL - Applies the ROWSCALINGVIENNACL preconditioner to a vector.
7170baa948SKarl Rupp 
7270baa948SKarl Rupp    Input Parameters:
7370baa948SKarl Rupp .  pc - the preconditioner context
7470baa948SKarl Rupp .  x - input vector
7570baa948SKarl Rupp 
7670baa948SKarl Rupp    Output Parameter:
7770baa948SKarl Rupp .  y - output vector
7870baa948SKarl Rupp 
7970baa948SKarl Rupp    Application Interface Routine: PCApply()
8070baa948SKarl Rupp  */
819371c9d4SSatish Balay static PetscErrorCode PCApply_ROWSCALINGVIENNACL(PC pc, Vec x, Vec y) {
8270baa948SKarl Rupp   PC_ROWSCALINGVIENNACL               *ilu = (PC_ROWSCALINGVIENNACL *)pc->data;
8370baa948SKarl Rupp   PetscBool                            flg1, flg2;
8470baa948SKarl Rupp   viennacl::vector<PetscScalar> const *xarray = NULL;
8570baa948SKarl Rupp   viennacl::vector<PetscScalar>       *yarray = NULL;
8670baa948SKarl Rupp 
8770baa948SKarl Rupp   PetscFunctionBegin;
8870baa948SKarl Rupp   /*how to apply a certain fixed number of iterations?*/
899566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)x, VECSEQVIENNACL, &flg1));
909566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)y, VECSEQVIENNACL, &flg2));
9108401ef6SPierre Jolivet   PetscCheck((flg1 && flg2), PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Currently only handles ViennaCL vectors");
92*48a46eb9SPierre Jolivet   if (!ilu->ROWSCALINGVIENNACL) PetscCall(PCSetUp_ROWSCALINGVIENNACL(pc));
939566063dSJacob Faibussowitsch   PetscCall(VecSet(y, 0.0));
949566063dSJacob Faibussowitsch   PetscCall(VecViennaCLGetArrayRead(x, &xarray));
959566063dSJacob Faibussowitsch   PetscCall(VecViennaCLGetArrayWrite(y, &yarray));
9670baa948SKarl Rupp   try {
9770baa948SKarl Rupp #if defined(PETSC_USE_COMPLEX)
9870baa948SKarl Rupp 
9970baa948SKarl Rupp #else
10070baa948SKarl Rupp     *yarray                               = *xarray;
10170baa948SKarl Rupp     ilu->ROWSCALINGVIENNACL->apply(*yarray);
10270baa948SKarl Rupp #endif
1039371c9d4SSatish Balay   } catch (char *ex) { SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex); }
1049566063dSJacob Faibussowitsch   PetscCall(VecViennaCLRestoreArrayRead(x, &xarray));
1059566063dSJacob Faibussowitsch   PetscCall(VecViennaCLRestoreArrayWrite(y, &yarray));
1069566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)y));
10770baa948SKarl Rupp   PetscFunctionReturn(0);
10870baa948SKarl Rupp }
10970baa948SKarl Rupp /* -------------------------------------------------------------------------- */
11070baa948SKarl Rupp /*
11170baa948SKarl Rupp    PCDestroy_ROWSCALINGVIENNACL - Destroys the private context for the ROWSCALINGVIENNACL preconditioner
11270baa948SKarl Rupp    that was created with PCCreate_ROWSCALINGVIENNACL().
11370baa948SKarl Rupp 
11470baa948SKarl Rupp    Input Parameter:
11570baa948SKarl Rupp .  pc - the preconditioner context
11670baa948SKarl Rupp 
11770baa948SKarl Rupp    Application Interface Routine: PCDestroy()
11870baa948SKarl Rupp */
1199371c9d4SSatish Balay static PetscErrorCode PCDestroy_ROWSCALINGVIENNACL(PC pc) {
12070baa948SKarl Rupp   PC_ROWSCALINGVIENNACL *rowscaling = (PC_ROWSCALINGVIENNACL *)pc->data;
12170baa948SKarl Rupp 
12270baa948SKarl Rupp   PetscFunctionBegin;
12370baa948SKarl Rupp   if (rowscaling->ROWSCALINGVIENNACL) {
12470baa948SKarl Rupp     try {
12570baa948SKarl Rupp       delete rowscaling->ROWSCALINGVIENNACL;
1269371c9d4SSatish Balay     } catch (char *ex) { SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex); }
12770baa948SKarl Rupp   }
12870baa948SKarl Rupp 
12970baa948SKarl Rupp   /*
13070baa948SKarl Rupp       Free the private data structure that was hanging off the PC
13170baa948SKarl Rupp   */
1329566063dSJacob Faibussowitsch   PetscCall(PetscFree(pc->data));
13370baa948SKarl Rupp   PetscFunctionReturn(0);
13470baa948SKarl Rupp }
13570baa948SKarl Rupp 
1369371c9d4SSatish Balay static PetscErrorCode PCSetFromOptions_ROWSCALINGVIENNACL(PC pc, PetscOptionItems *PetscOptionsObject) {
13770baa948SKarl Rupp   PetscFunctionBegin;
138d0609cedSBarry Smith   PetscOptionsHeadBegin(PetscOptionsObject, "ROWSCALINGVIENNACL options");
139d0609cedSBarry Smith   PetscOptionsHeadEnd();
14070baa948SKarl Rupp   PetscFunctionReturn(0);
14170baa948SKarl Rupp }
14270baa948SKarl Rupp 
14370baa948SKarl Rupp /* -------------------------------------------------------------------------- */
14470baa948SKarl Rupp 
14570baa948SKarl Rupp /*MC
14670baa948SKarl Rupp      PCRowScalingViennaCL  - A diagonal preconditioner (scaling rows of matrices by their norm) that can be used via the CUDA, OpenCL, and OpenMP backends of ViennaCL
14770baa948SKarl Rupp 
14870baa948SKarl Rupp    Level: advanced
14970baa948SKarl Rupp 
150db781477SPatrick Sanan .seealso: `PCCreate()`, `PCSetType()`, `PCType`, `PC`
15170baa948SKarl Rupp 
15270baa948SKarl Rupp M*/
15370baa948SKarl Rupp 
1549371c9d4SSatish Balay PETSC_EXTERN PetscErrorCode PCCreate_ROWSCALINGVIENNACL(PC pc) {
15570baa948SKarl Rupp   PC_ROWSCALINGVIENNACL *rowscaling;
15670baa948SKarl Rupp 
15770baa948SKarl Rupp   PetscFunctionBegin;
15870baa948SKarl Rupp   /*
15970baa948SKarl Rupp      Creates the private data structure for this preconditioner and
16070baa948SKarl Rupp      attach it to the PC object.
16170baa948SKarl Rupp   */
1629566063dSJacob Faibussowitsch   PetscCall(PetscNewLog(pc, &rowscaling));
16370baa948SKarl Rupp   pc->data = (void *)rowscaling;
16470baa948SKarl Rupp 
16570baa948SKarl Rupp   /*
16670baa948SKarl Rupp      Initialize the pointer to zero
16770baa948SKarl Rupp      Initialize number of v-cycles to default (1)
16870baa948SKarl Rupp   */
16970baa948SKarl Rupp   rowscaling->ROWSCALINGVIENNACL = 0;
17070baa948SKarl Rupp 
17170baa948SKarl Rupp   /*
17270baa948SKarl Rupp       Set the pointers for the functions that are provided above.
17370baa948SKarl Rupp       Now when the user-level routines (such as PCApply(), PCDestroy(), etc.)
17470baa948SKarl Rupp       are called, they will automatically call these functions.  Note we
17570baa948SKarl Rupp       choose not to provide a couple of these functions since they are
17670baa948SKarl Rupp       not needed.
17770baa948SKarl Rupp   */
17870baa948SKarl Rupp   pc->ops->apply               = PCApply_ROWSCALINGVIENNACL;
17970baa948SKarl Rupp   pc->ops->applytranspose      = 0;
18070baa948SKarl Rupp   pc->ops->setup               = PCSetUp_ROWSCALINGVIENNACL;
18170baa948SKarl Rupp   pc->ops->destroy             = PCDestroy_ROWSCALINGVIENNACL;
18270baa948SKarl Rupp   pc->ops->setfromoptions      = PCSetFromOptions_ROWSCALINGVIENNACL;
18370baa948SKarl Rupp   pc->ops->view                = 0;
18470baa948SKarl Rupp   pc->ops->applyrichardson     = 0;
18570baa948SKarl Rupp   pc->ops->applysymmetricleft  = 0;
18670baa948SKarl Rupp   pc->ops->applysymmetricright = 0;
18770baa948SKarl Rupp   PetscFunctionReturn(0);
18870baa948SKarl Rupp }
189