xref: /petsc/src/ksp/pc/impls/rowscalingviennacl/rowscalingviennacl.cxx (revision d71ae5a4db6382e7f06317b8d368875286fe9008)
170baa948SKarl Rupp 
/*
   Include files needed for the ViennaCL row-scaling preconditioner:
     pcimpl.h - private include file intended for use by all preconditioners
*/
670baa948SKarl Rupp #define PETSC_SKIP_SPINLOCK
799acd6aaSStefano Zampini #define PETSC_SKIP_IMMINTRIN_H_CUDAWORKAROUND 1
899acd6aaSStefano Zampini 
970baa948SKarl Rupp #include <petsc/private/pcimpl.h> /*I "petscpc.h" I*/
1070baa948SKarl Rupp #include <../src/mat/impls/aij/seq/aij.h>
1170baa948SKarl Rupp #include <../src/vec/vec/impls/dvecimpl.h>
1270baa948SKarl Rupp #include <../src/mat/impls/aij/seq/seqviennacl/viennaclmatimpl.h>
1370baa948SKarl Rupp #include <../src/vec/vec/impls/seq/seqviennacl/viennaclvecimpl.h>
1470baa948SKarl Rupp #include <viennacl/linalg/row_scaling.hpp>
1570baa948SKarl Rupp 
/*
   Private context (data structure) for the ROWSCALINGVIENNACL preconditioner.
*/
1970baa948SKarl Rupp typedef struct {
2070baa948SKarl Rupp   viennacl::linalg::row_scaling<viennacl::compressed_matrix<PetscScalar>> *ROWSCALINGVIENNACL;
2170baa948SKarl Rupp } PC_ROWSCALINGVIENNACL;
2270baa948SKarl Rupp 
/*
   PCSetUp_ROWSCALINGVIENNACL - Prepares for the use of the ROWSCALINGVIENNACL preconditioner
                                by setting data structures and options.

   Input Parameter:
.  pc - the preconditioner context

   Application Interface Routine: PCSetUp()

   Note:
   The interface routine PCSetUp() is not usually called directly by
   the user, but instead is called by PCApply() if necessary.
*/
36*d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCSetUp_ROWSCALINGVIENNACL(PC pc)
37*d71ae5a4SJacob Faibussowitsch {
3870baa948SKarl Rupp   PC_ROWSCALINGVIENNACL *rowscaling = (PC_ROWSCALINGVIENNACL *)pc->data;
3970baa948SKarl Rupp   PetscBool              flg        = PETSC_FALSE;
4070baa948SKarl Rupp   Mat_SeqAIJViennaCL    *gpustruct;
4170baa948SKarl Rupp 
4270baa948SKarl Rupp   PetscFunctionBegin;
439566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)pc->pmat, MATSEQAIJVIENNACL, &flg));
4428b400f6SJacob Faibussowitsch   PetscCheck(flg, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Currently only handles ViennaCL matrices");
4570baa948SKarl Rupp   if (pc->setupcalled != 0) {
4670baa948SKarl Rupp     try {
4770baa948SKarl Rupp       delete rowscaling->ROWSCALINGVIENNACL;
48*d71ae5a4SJacob Faibussowitsch     } catch (char *ex) {
49*d71ae5a4SJacob Faibussowitsch       SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex);
50*d71ae5a4SJacob Faibussowitsch     }
5170baa948SKarl Rupp   }
5270baa948SKarl Rupp   try {
5370baa948SKarl Rupp #if defined(PETSC_USE_COMPLEX)
5470baa948SKarl Rupp     gpustruct = NULL;
5570baa948SKarl Rupp     SETERRQ(PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "No support for complex arithmetic in ROWSCALINGVIENNACL preconditioner");
5670baa948SKarl Rupp #else
579566063dSJacob Faibussowitsch     PetscCall(MatViennaCLCopyToGPU(pc->pmat));
5870baa948SKarl Rupp     gpustruct = (Mat_SeqAIJViennaCL *)(pc->pmat->spptr);
5970baa948SKarl Rupp 
6070baa948SKarl Rupp     viennacl::linalg::row_scaling_tag pc_tag(1);
6170baa948SKarl Rupp     ViennaCLAIJMatrix                *mat = (ViennaCLAIJMatrix *)gpustruct->mat;
6270baa948SKarl Rupp     rowscaling->ROWSCALINGVIENNACL        = new viennacl::linalg::row_scaling<viennacl::compressed_matrix<PetscScalar>>(*mat, pc_tag);
6370baa948SKarl Rupp #endif
64*d71ae5a4SJacob Faibussowitsch   } catch (char *ex) {
65*d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex);
66*d71ae5a4SJacob Faibussowitsch   }
6770baa948SKarl Rupp   PetscFunctionReturn(0);
6870baa948SKarl Rupp }
6970baa948SKarl Rupp 
/*
   PCApply_ROWSCALINGVIENNACL - Applies the ROWSCALINGVIENNACL preconditioner to a vector.

   Input Parameters:
+  pc - the preconditioner context
-  x - input vector

   Output Parameter:
.  y - output vector

   Application Interface Routine: PCApply()
 */
82*d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCApply_ROWSCALINGVIENNACL(PC pc, Vec x, Vec y)
83*d71ae5a4SJacob Faibussowitsch {
8470baa948SKarl Rupp   PC_ROWSCALINGVIENNACL               *ilu = (PC_ROWSCALINGVIENNACL *)pc->data;
8570baa948SKarl Rupp   PetscBool                            flg1, flg2;
8670baa948SKarl Rupp   viennacl::vector<PetscScalar> const *xarray = NULL;
8770baa948SKarl Rupp   viennacl::vector<PetscScalar>       *yarray = NULL;
8870baa948SKarl Rupp 
8970baa948SKarl Rupp   PetscFunctionBegin;
9070baa948SKarl Rupp   /*how to apply a certain fixed number of iterations?*/
919566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)x, VECSEQVIENNACL, &flg1));
929566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)y, VECSEQVIENNACL, &flg2));
9308401ef6SPierre Jolivet   PetscCheck((flg1 && flg2), PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Currently only handles ViennaCL vectors");
9448a46eb9SPierre Jolivet   if (!ilu->ROWSCALINGVIENNACL) PetscCall(PCSetUp_ROWSCALINGVIENNACL(pc));
959566063dSJacob Faibussowitsch   PetscCall(VecSet(y, 0.0));
969566063dSJacob Faibussowitsch   PetscCall(VecViennaCLGetArrayRead(x, &xarray));
979566063dSJacob Faibussowitsch   PetscCall(VecViennaCLGetArrayWrite(y, &yarray));
9870baa948SKarl Rupp   try {
9970baa948SKarl Rupp #if defined(PETSC_USE_COMPLEX)
10070baa948SKarl Rupp 
10170baa948SKarl Rupp #else
10270baa948SKarl Rupp     *yarray                               = *xarray;
10370baa948SKarl Rupp     ilu->ROWSCALINGVIENNACL->apply(*yarray);
10470baa948SKarl Rupp #endif
105*d71ae5a4SJacob Faibussowitsch   } catch (char *ex) {
106*d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex);
107*d71ae5a4SJacob Faibussowitsch   }
1089566063dSJacob Faibussowitsch   PetscCall(VecViennaCLRestoreArrayRead(x, &xarray));
1099566063dSJacob Faibussowitsch   PetscCall(VecViennaCLRestoreArrayWrite(y, &yarray));
1109566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)y));
11170baa948SKarl Rupp   PetscFunctionReturn(0);
11270baa948SKarl Rupp }
113f1580f4eSBarry Smith 
/*
   PCDestroy_ROWSCALINGVIENNACL - Destroys the private context for the ROWSCALINGVIENNACL preconditioner
   that was created with PCCreate_ROWSCALINGVIENNACL().

   Input Parameter:
.  pc - the preconditioner context

   Application Interface Routine: PCDestroy()
*/
123*d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCDestroy_ROWSCALINGVIENNACL(PC pc)
124*d71ae5a4SJacob Faibussowitsch {
12570baa948SKarl Rupp   PC_ROWSCALINGVIENNACL *rowscaling = (PC_ROWSCALINGVIENNACL *)pc->data;
12670baa948SKarl Rupp 
12770baa948SKarl Rupp   PetscFunctionBegin;
12870baa948SKarl Rupp   if (rowscaling->ROWSCALINGVIENNACL) {
12970baa948SKarl Rupp     try {
13070baa948SKarl Rupp       delete rowscaling->ROWSCALINGVIENNACL;
131*d71ae5a4SJacob Faibussowitsch     } catch (char *ex) {
132*d71ae5a4SJacob Faibussowitsch       SETERRQ(PETSC_COMM_SELF, PETSC_ERR_LIB, "ViennaCL error: %s", ex);
133*d71ae5a4SJacob Faibussowitsch     }
13470baa948SKarl Rupp   }
13570baa948SKarl Rupp 
13670baa948SKarl Rupp   /*
13770baa948SKarl Rupp       Free the private data structure that was hanging off the PC
13870baa948SKarl Rupp   */
1399566063dSJacob Faibussowitsch   PetscCall(PetscFree(pc->data));
14070baa948SKarl Rupp   PetscFunctionReturn(0);
14170baa948SKarl Rupp }
14270baa948SKarl Rupp 
143*d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCSetFromOptions_ROWSCALINGVIENNACL(PC pc, PetscOptionItems *PetscOptionsObject)
144*d71ae5a4SJacob Faibussowitsch {
14570baa948SKarl Rupp   PetscFunctionBegin;
146d0609cedSBarry Smith   PetscOptionsHeadBegin(PetscOptionsObject, "ROWSCALINGVIENNACL options");
147d0609cedSBarry Smith   PetscOptionsHeadEnd();
14870baa948SKarl Rupp   PetscFunctionReturn(0);
14970baa948SKarl Rupp }
15070baa948SKarl Rupp 
/*MC
     PCRowScalingViennaCL  - A diagonal preconditioner (scaling rows of matrices by their norm) that can be used via the CUDA, OpenCL, and OpenMP backends of ViennaCL

   Level: advanced

   Developer Note:
   This `PCType` does not appear to be registered

.seealso: `PCCreate()`, `PCSetType()`, `PCType`, `PC`
M*/
16170baa948SKarl Rupp 
162*d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode PCCreate_ROWSCALINGVIENNACL(PC pc)
163*d71ae5a4SJacob Faibussowitsch {
16470baa948SKarl Rupp   PC_ROWSCALINGVIENNACL *rowscaling;
16570baa948SKarl Rupp 
16670baa948SKarl Rupp   PetscFunctionBegin;
16770baa948SKarl Rupp   /*
16870baa948SKarl Rupp      Creates the private data structure for this preconditioner and
16970baa948SKarl Rupp      attach it to the PC object.
17070baa948SKarl Rupp   */
1714dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&rowscaling));
17270baa948SKarl Rupp   pc->data = (void *)rowscaling;
17370baa948SKarl Rupp 
17470baa948SKarl Rupp   /*
17570baa948SKarl Rupp      Initialize the pointer to zero
17670baa948SKarl Rupp      Initialize number of v-cycles to default (1)
17770baa948SKarl Rupp   */
17870baa948SKarl Rupp   rowscaling->ROWSCALINGVIENNACL = 0;
17970baa948SKarl Rupp 
18070baa948SKarl Rupp   /*
18170baa948SKarl Rupp       Set the pointers for the functions that are provided above.
18270baa948SKarl Rupp       Now when the user-level routines (such as PCApply(), PCDestroy(), etc.)
18370baa948SKarl Rupp       are called, they will automatically call these functions.  Note we
18470baa948SKarl Rupp       choose not to provide a couple of these functions since they are
18570baa948SKarl Rupp       not needed.
18670baa948SKarl Rupp   */
18770baa948SKarl Rupp   pc->ops->apply               = PCApply_ROWSCALINGVIENNACL;
18870baa948SKarl Rupp   pc->ops->applytranspose      = 0;
18970baa948SKarl Rupp   pc->ops->setup               = PCSetUp_ROWSCALINGVIENNACL;
19070baa948SKarl Rupp   pc->ops->destroy             = PCDestroy_ROWSCALINGVIENNACL;
19170baa948SKarl Rupp   pc->ops->setfromoptions      = PCSetFromOptions_ROWSCALINGVIENNACL;
19270baa948SKarl Rupp   pc->ops->view                = 0;
19370baa948SKarl Rupp   pc->ops->applyrichardson     = 0;
19470baa948SKarl Rupp   pc->ops->applysymmetricleft  = 0;
19570baa948SKarl Rupp   pc->ops->applysymmetricright = 0;
19670baa948SKarl Rupp   PetscFunctionReturn(0);
19770baa948SKarl Rupp }
198