xref: /petsc/src/mat/impls/hypre/mhypre.c (revision cac4c232dc4f93991e342196e27ef7b0655dac7b)
163c07aadSStefano Zampini 
263c07aadSStefano Zampini /*
363c07aadSStefano Zampini     Creates hypre ijmatrix from PETSc matrix
463c07aadSStefano Zampini */
5225daaf8SStefano Zampini 
6c6698e78SStefano Zampini #include <petscpkg_version.h>
739accc25SStefano Zampini #include <petsc/private/petschypre.h>
8dd9c0a25Sstefano_zampini #include <petscmathypre.h>
963c07aadSStefano Zampini #include <petsc/private/matimpl.h>
10a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h>
1163c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h>
1263c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h>
1358968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h>
1458968eb6SStefano Zampini #include <HYPRE.h>
15c1a070e6SStefano Zampini #include <HYPRE_utilities.h>
16cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h>
1768ec7858SStefano Zampini #include <_hypre_sstruct_ls.h>
1863c07aadSStefano Zampini 
190e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0)
200e6427aaSSatish Balay #define  hypre_ParCSRMatrixClone(A,B) hypre_ParCSRMatrixCompleteClone(A)
210e6427aaSSatish Balay #endif
220e6427aaSSatish Balay 
2363c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat,Mat_HYPRE*);
2463c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat,Mat,HYPRE_IJMatrix);
2563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat,HYPRE_IJMatrix);
2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat,HYPRE_IJMatrix);
2739accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat,HYPRE_Complex,Vec,HYPRE_Complex,Vec,PetscBool);
28225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void*);
296ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat,PetscInt,const PetscInt[],PetscInt,const PetscInt[],const PetscScalar[],InsertMode ins);
3063c07aadSStefano Zampini 
3163c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij)
3263c07aadSStefano Zampini {
3363c07aadSStefano Zampini   PetscInt       i,n_d,n_o;
3463c07aadSStefano Zampini   const PetscInt *ia_d,*ia_o;
3563c07aadSStefano Zampini   PetscBool      done_d=PETSC_FALSE,done_o=PETSC_FALSE;
362cf14000SStefano Zampini   HYPRE_Int      *nnz_d=NULL,*nnz_o=NULL;
3763c07aadSStefano Zampini 
3863c07aadSStefano Zampini   PetscFunctionBegin;
3963c07aadSStefano Zampini   if (A_d) { /* determine number of nonzero entries in local diagonal part */
409566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(A_d,0,PETSC_FALSE,PETSC_FALSE,&n_d,&ia_d,NULL,&done_d));
4163c07aadSStefano Zampini     if (done_d) {
429566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(n_d,&nnz_d));
4363c07aadSStefano Zampini       for (i=0; i<n_d; i++) {
4463c07aadSStefano Zampini         nnz_d[i] = ia_d[i+1] - ia_d[i];
4563c07aadSStefano Zampini       }
4663c07aadSStefano Zampini     }
479566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowIJ(A_d,0,PETSC_FALSE,PETSC_FALSE,NULL,&ia_d,NULL,&done_d));
4863c07aadSStefano Zampini   }
4963c07aadSStefano Zampini   if (A_o) { /* determine number of nonzero entries in local off-diagonal part */
509566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(A_o,0,PETSC_FALSE,PETSC_FALSE,&n_o,&ia_o,NULL,&done_o));
5163c07aadSStefano Zampini     if (done_o) {
529566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(n_o,&nnz_o));
5363c07aadSStefano Zampini       for (i=0; i<n_o; i++) {
5463c07aadSStefano Zampini         nnz_o[i] = ia_o[i+1] - ia_o[i];
5563c07aadSStefano Zampini       }
5663c07aadSStefano Zampini     }
579566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowIJ(A_o,0,PETSC_FALSE,PETSC_FALSE,&n_o,&ia_o,NULL,&done_o));
5863c07aadSStefano Zampini   }
5963c07aadSStefano Zampini   if (done_d) {    /* set number of nonzeros in HYPRE IJ matrix */
6063c07aadSStefano Zampini     if (!done_o) { /* only diagonal part */
619566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(n_d,&nnz_o));
6263c07aadSStefano Zampini     }
63c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0)
64c6698e78SStefano Zampini     { /* If we don't do this, the columns of the matrix will be all zeros! */
65c6698e78SStefano Zampini       hypre_AuxParCSRMatrix *aux_matrix;
66c6698e78SStefano Zampini       aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij);
67c6698e78SStefano Zampini       hypre_AuxParCSRMatrixDestroy(aux_matrix);
68c6698e78SStefano Zampini       hypre_IJMatrixTranslator(ij) = NULL;
69a74df02fSJacob Faibussowitsch       PetscStackCallStandard(HYPRE_IJMatrixSetDiagOffdSizes,ij,nnz_d,nnz_o);
7022235d61SPierre Jolivet       /* it seems they partially fixed it in 2.19.0 */
7122235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0)
72c6698e78SStefano Zampini       aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij);
73c6698e78SStefano Zampini       hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1;
7422235d61SPierre Jolivet #endif
75c6698e78SStefano Zampini     }
76c6698e78SStefano Zampini #else
77a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixSetDiagOffdSizes,ij,nnz_d,nnz_o);
78c6698e78SStefano Zampini #endif
799566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz_d));
809566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz_o));
8163c07aadSStefano Zampini   }
8263c07aadSStefano Zampini   PetscFunctionReturn(0);
8363c07aadSStefano Zampini }
8463c07aadSStefano Zampini 
8563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA)
8663c07aadSStefano Zampini {
8763c07aadSStefano Zampini   PetscInt       rstart,rend,cstart,cend;
8863c07aadSStefano Zampini 
8963c07aadSStefano Zampini   PetscFunctionBegin;
909566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
919566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
9263c07aadSStefano Zampini   rstart = A->rmap->rstart;
9363c07aadSStefano Zampini   rend   = A->rmap->rend;
9463c07aadSStefano Zampini   cstart = A->cmap->rstart;
9563c07aadSStefano Zampini   cend   = A->cmap->rend;
96a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixCreate,hA->comm,rstart,rend-1,cstart,cend-1,&hA->ij);
97a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR);
9863c07aadSStefano Zampini   {
9963c07aadSStefano Zampini     PetscBool      same;
10063c07aadSStefano Zampini     Mat            A_d,A_o;
10163c07aadSStefano Zampini     const PetscInt *colmap;
1029566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&same));
10363c07aadSStefano Zampini     if (same) {
1049566063dSJacob Faibussowitsch       PetscCall(MatMPIAIJGetSeqAIJ(A,&A_d,&A_o,&colmap));
1059566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A_d,A_o,hA->ij));
10663c07aadSStefano Zampini       PetscFunctionReturn(0);
10763c07aadSStefano Zampini     }
1089566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIBAIJ,&same));
10963c07aadSStefano Zampini     if (same) {
1109566063dSJacob Faibussowitsch       PetscCall(MatMPIBAIJGetSeqBAIJ(A,&A_d,&A_o,&colmap));
1119566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A_d,A_o,hA->ij));
11263c07aadSStefano Zampini       PetscFunctionReturn(0);
11363c07aadSStefano Zampini     }
1149566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&same));
11563c07aadSStefano Zampini     if (same) {
1169566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A,NULL,hA->ij));
11763c07aadSStefano Zampini       PetscFunctionReturn(0);
11863c07aadSStefano Zampini     }
1199566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQBAIJ,&same));
12063c07aadSStefano Zampini     if (same) {
1219566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A,NULL,hA->ij));
12263c07aadSStefano Zampini       PetscFunctionReturn(0);
12363c07aadSStefano Zampini     }
12463c07aadSStefano Zampini   }
12563c07aadSStefano Zampini   PetscFunctionReturn(0);
12663c07aadSStefano Zampini }
12763c07aadSStefano Zampini 
12863c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopy(Mat A, HYPRE_IJMatrix ij)
12963c07aadSStefano Zampini {
13063c07aadSStefano Zampini   PetscInt          i,rstart,rend,ncols,nr,nc;
13163c07aadSStefano Zampini   const PetscScalar *values;
13263c07aadSStefano Zampini   const PetscInt    *cols;
13363c07aadSStefano Zampini   PetscBool         flg;
13463c07aadSStefano Zampini 
13563c07aadSStefano Zampini   PetscFunctionBegin;
1366ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0)
137a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixInitialize,ij);
1386ea7df73SStefano Zampini #else
139a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixInitialize_v2,ij,HYPRE_MEMORY_HOST);
1406ea7df73SStefano Zampini #endif
1419566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&flg));
1429566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A,&nr,&nc));
14363c07aadSStefano Zampini   if (flg && nr == nc) {
1449566063dSJacob Faibussowitsch     PetscCall(MatHYPRE_IJMatrixFastCopy_MPIAIJ(A,ij));
14563c07aadSStefano Zampini     PetscFunctionReturn(0);
14663c07aadSStefano Zampini   }
1479566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&flg));
14863c07aadSStefano Zampini   if (flg) {
1499566063dSJacob Faibussowitsch     PetscCall(MatHYPRE_IJMatrixFastCopy_SeqAIJ(A,ij));
15063c07aadSStefano Zampini     PetscFunctionReturn(0);
15163c07aadSStefano Zampini   }
15263c07aadSStefano Zampini 
1535fbaff96SJunchao Zhang   /* Do not need Aux since we have done precise i[],j[] allocation in MatHYPRE_CreateFromMat() */
1545fbaff96SJunchao Zhang   hypre_AuxParCSRMatrixNeedAux((hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij)) = 0;
1555fbaff96SJunchao Zhang 
1569566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A,&rstart,&rend));
15763c07aadSStefano Zampini   for (i=rstart; i<rend; i++) {
1589566063dSJacob Faibussowitsch     PetscCall(MatGetRow(A,i,&ncols,&cols,&values));
159e3977e59Sstefano_zampini     if (ncols) {
1602cf14000SStefano Zampini       HYPRE_Int nc = (HYPRE_Int)ncols;
1612cf14000SStefano Zampini 
1622c71b3e2SJacob Faibussowitsch       PetscCheckFalse((PetscInt)nc != ncols,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,ncols,i);
163a74df02fSJacob Faibussowitsch       PetscStackCallStandard(HYPRE_IJMatrixSetValues,ij,1,&nc,(HYPRE_BigInt *)&i,(HYPRE_BigInt *)cols,(HYPRE_Complex *)values);
164e3977e59Sstefano_zampini     }
1659566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow(A,i,&ncols,&cols,&values));
16663c07aadSStefano Zampini   }
16763c07aadSStefano Zampini   PetscFunctionReturn(0);
16863c07aadSStefano Zampini }
16963c07aadSStefano Zampini 
17063c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat A, HYPRE_IJMatrix ij)
17163c07aadSStefano Zampini {
17263c07aadSStefano Zampini   Mat_SeqAIJ            *pdiag = (Mat_SeqAIJ*)A->data;
17358968eb6SStefano Zampini   HYPRE_Int             type;
17463c07aadSStefano Zampini   hypre_ParCSRMatrix    *par_matrix;
17563c07aadSStefano Zampini   hypre_AuxParCSRMatrix *aux_matrix;
17663c07aadSStefano Zampini   hypre_CSRMatrix       *hdiag;
1772cf14000SStefano Zampini   PetscBool             sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
1786ea7df73SStefano Zampini   const PetscScalar     *pa;
17963c07aadSStefano Zampini 
18063c07aadSStefano Zampini   PetscFunctionBegin;
181a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,ij,&type);
1822c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
183a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,ij,(void**)&par_matrix);
18463c07aadSStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(par_matrix);
18563c07aadSStefano Zampini   /*
18663c07aadSStefano Zampini        this is the Hack part where we monkey directly with the hypre datastructures
18763c07aadSStefano Zampini   */
1882cf14000SStefano Zampini   if (sameint) {
1899566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->i,pdiag->i,A->rmap->n + 1));
1909566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->j,pdiag->j,pdiag->nz));
1912cf14000SStefano Zampini   } else {
1922cf14000SStefano Zampini     PetscInt i;
1932cf14000SStefano Zampini 
1942cf14000SStefano Zampini     for (i=0;i<A->rmap->n + 1;i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i];
1952cf14000SStefano Zampini     for (i=0;i<pdiag->nz;i++)      hdiag->j[i] = (HYPRE_Int)pdiag->j[i];
1962cf14000SStefano Zampini   }
1976ea7df73SStefano Zampini 
1989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A,&pa));
1999566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(hdiag->data,pa,pdiag->nz));
2009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A,&pa));
201ea9daf28SStefano Zampini 
202ea9daf28SStefano Zampini   aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij);
20363c07aadSStefano Zampini   hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0;
20463c07aadSStefano Zampini   PetscFunctionReturn(0);
20563c07aadSStefano Zampini }
20663c07aadSStefano Zampini 
20763c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat A, HYPRE_IJMatrix ij)
20863c07aadSStefano Zampini {
20963c07aadSStefano Zampini   Mat_MPIAIJ            *pA = (Mat_MPIAIJ*)A->data;
21063c07aadSStefano Zampini   Mat_SeqAIJ            *pdiag,*poffd;
21163c07aadSStefano Zampini   PetscInt              i,*garray = pA->garray,*jj,cstart,*pjj;
2122cf14000SStefano Zampini   HYPRE_Int             *hjj,type;
21363c07aadSStefano Zampini   hypre_ParCSRMatrix    *par_matrix;
21463c07aadSStefano Zampini   hypre_AuxParCSRMatrix *aux_matrix;
21563c07aadSStefano Zampini   hypre_CSRMatrix       *hdiag,*hoffd;
2162cf14000SStefano Zampini   PetscBool             sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
2176ea7df73SStefano Zampini   const PetscScalar     *pa;
21863c07aadSStefano Zampini 
21963c07aadSStefano Zampini   PetscFunctionBegin;
22063c07aadSStefano Zampini   pdiag = (Mat_SeqAIJ*) pA->A->data;
22163c07aadSStefano Zampini   poffd = (Mat_SeqAIJ*) pA->B->data;
22263c07aadSStefano Zampini   /* cstart is only valid for square MPIAIJ layed out in the usual way */
2239566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A,&cstart,NULL));
22463c07aadSStefano Zampini 
225a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,ij,&type);
2262c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
227a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,ij,(void**)&par_matrix);
22863c07aadSStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(par_matrix);
22963c07aadSStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(par_matrix);
23063c07aadSStefano Zampini 
23163c07aadSStefano Zampini   /*
23263c07aadSStefano Zampini        this is the Hack part where we monkey directly with the hypre datastructures
23363c07aadSStefano Zampini   */
2342cf14000SStefano Zampini   if (sameint) {
2359566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->i,pdiag->i,pA->A->rmap->n + 1));
2362cf14000SStefano Zampini   } else {
2372cf14000SStefano Zampini     for (i=0; i<pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)(pdiag->i[i]);
2382cf14000SStefano Zampini   }
23963c07aadSStefano Zampini   /* need to shift the diag column indices (hdiag->j) back to global numbering since hypre is expecting this */
2402cf14000SStefano Zampini   hjj = hdiag->j;
2412cf14000SStefano Zampini   pjj = pdiag->j;
242c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0)
2432cf14000SStefano Zampini   for (i=0; i<pdiag->nz; i++) hjj[i] = pjj[i];
244c6698e78SStefano Zampini #else
2452cf14000SStefano Zampini   for (i=0; i<pdiag->nz; i++) hjj[i] = cstart + pjj[i];
246c6698e78SStefano Zampini #endif
2479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(pA->A,&pa));
2489566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(hdiag->data,pa,pdiag->nz));
2499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(pA->A,&pa));
2502cf14000SStefano Zampini   if (sameint) {
2519566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hoffd->i,poffd->i,pA->A->rmap->n + 1));
2522cf14000SStefano Zampini   } else {
2532cf14000SStefano Zampini     for (i=0; i<pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)(poffd->i[i]);
2542cf14000SStefano Zampini   }
2552cf14000SStefano Zampini 
25663c07aadSStefano Zampini   /* need to move the offd column indices (hoffd->j) back to global numbering since hypre is expecting this
25763c07aadSStefano Zampini      If we hacked a hypre a bit more we might be able to avoid this step */
258c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0)
259a74df02fSJacob Faibussowitsch   PetscStackCallStandard(hypre_CSRMatrixBigInitialize,hoffd);
260c6698e78SStefano Zampini   jj  = (PetscInt*) hoffd->big_j;
261c6698e78SStefano Zampini #else
26263c07aadSStefano Zampini   jj  = (PetscInt*) hoffd->j;
263c6698e78SStefano Zampini #endif
2642cf14000SStefano Zampini   pjj = poffd->j;
26563c07aadSStefano Zampini   for (i=0; i<poffd->nz; i++) jj[i] = garray[pjj[i]];
266c6698e78SStefano Zampini 
2679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(pA->B,&pa));
2689566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(hoffd->data,pa,poffd->nz));
2699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(pA->B,&pa));
27063c07aadSStefano Zampini 
271ea9daf28SStefano Zampini   aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij);
27263c07aadSStefano Zampini   hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0;
27363c07aadSStefano Zampini   PetscFunctionReturn(0);
27463c07aadSStefano Zampini }
27563c07aadSStefano Zampini 
2762df22349SStefano Zampini static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat* B)
2772df22349SStefano Zampini {
2782df22349SStefano Zampini   Mat_HYPRE*             mhA = (Mat_HYPRE*)(A->data);
2792df22349SStefano Zampini   Mat                    lA;
2802df22349SStefano Zampini   ISLocalToGlobalMapping rl2g,cl2g;
2812df22349SStefano Zampini   IS                     is;
2822df22349SStefano Zampini   hypre_ParCSRMatrix     *hA;
2832df22349SStefano Zampini   hypre_CSRMatrix        *hdiag,*hoffd;
2842df22349SStefano Zampini   MPI_Comm               comm;
28539accc25SStefano Zampini   HYPRE_Complex          *hdd,*hod,*aa;
28639accc25SStefano Zampini   PetscScalar            *data;
2872cf14000SStefano Zampini   HYPRE_BigInt           *col_map_offd;
2882cf14000SStefano Zampini   HYPRE_Int              *hdi,*hdj,*hoi,*hoj;
2892df22349SStefano Zampini   PetscInt               *ii,*jj,*iptr,*jptr;
2902df22349SStefano Zampini   PetscInt               cum,dr,dc,oc,str,stc,nnz,i,jd,jo,M,N;
29158968eb6SStefano Zampini   HYPRE_Int              type;
2922df22349SStefano Zampini 
2932df22349SStefano Zampini   PetscFunctionBegin;
294a1787963SStefano Zampini   comm = PetscObjectComm((PetscObject)A);
295a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,mhA->ij,&type);
2962c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
297a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,mhA->ij,(void**)&hA);
2982df22349SStefano Zampini   M     = hypre_ParCSRMatrixGlobalNumRows(hA);
2992df22349SStefano Zampini   N     = hypre_ParCSRMatrixGlobalNumCols(hA);
3002df22349SStefano Zampini   str   = hypre_ParCSRMatrixFirstRowIndex(hA);
3012df22349SStefano Zampini   stc   = hypre_ParCSRMatrixFirstColDiag(hA);
3022df22349SStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(hA);
3032df22349SStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(hA);
3042df22349SStefano Zampini   dr    = hypre_CSRMatrixNumRows(hdiag);
3052df22349SStefano Zampini   dc    = hypre_CSRMatrixNumCols(hdiag);
3062df22349SStefano Zampini   nnz   = hypre_CSRMatrixNumNonzeros(hdiag);
3072df22349SStefano Zampini   hdi   = hypre_CSRMatrixI(hdiag);
3082df22349SStefano Zampini   hdj   = hypre_CSRMatrixJ(hdiag);
3092df22349SStefano Zampini   hdd   = hypre_CSRMatrixData(hdiag);
3102df22349SStefano Zampini   oc    = hypre_CSRMatrixNumCols(hoffd);
3112df22349SStefano Zampini   nnz  += hypre_CSRMatrixNumNonzeros(hoffd);
3122df22349SStefano Zampini   hoi   = hypre_CSRMatrixI(hoffd);
3132df22349SStefano Zampini   hoj   = hypre_CSRMatrixJ(hoffd);
3142df22349SStefano Zampini   hod   = hypre_CSRMatrixData(hoffd);
3152df22349SStefano Zampini   if (reuse != MAT_REUSE_MATRIX) {
3162df22349SStefano Zampini     PetscInt *aux;
3172df22349SStefano Zampini 
3182df22349SStefano Zampini     /* generate l2g maps for rows and cols */
3199566063dSJacob Faibussowitsch     PetscCall(ISCreateStride(comm,dr,str,1,&is));
3209566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingCreateIS(is,&rl2g));
3219566063dSJacob Faibussowitsch     PetscCall(ISDestroy(&is));
3222df22349SStefano Zampini     col_map_offd = hypre_ParCSRMatrixColMapOffd(hA);
3239566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dc+oc,&aux));
3242df22349SStefano Zampini     for (i=0; i<dc; i++) aux[i] = i+stc;
3252df22349SStefano Zampini     for (i=0; i<oc; i++) aux[i+dc] = col_map_offd[i];
3269566063dSJacob Faibussowitsch     PetscCall(ISCreateGeneral(comm,dc+oc,aux,PETSC_OWN_POINTER,&is));
3279566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingCreateIS(is,&cl2g));
3289566063dSJacob Faibussowitsch     PetscCall(ISDestroy(&is));
3292df22349SStefano Zampini     /* create MATIS object */
3309566063dSJacob Faibussowitsch     PetscCall(MatCreate(comm,B));
3319566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(*B,dr,dc,M,N));
3329566063dSJacob Faibussowitsch     PetscCall(MatSetType(*B,MATIS));
3339566063dSJacob Faibussowitsch     PetscCall(MatSetLocalToGlobalMapping(*B,rl2g,cl2g));
3349566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingDestroy(&rl2g));
3359566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingDestroy(&cl2g));
3362df22349SStefano Zampini 
3372df22349SStefano Zampini     /* allocate CSR for local matrix */
3389566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dr+1,&iptr));
3399566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz,&jptr));
3409566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz,&data));
3412df22349SStefano Zampini   } else {
3422df22349SStefano Zampini     PetscInt  nr;
3432df22349SStefano Zampini     PetscBool done;
3449566063dSJacob Faibussowitsch     PetscCall(MatISGetLocalMat(*B,&lA));
3459566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(lA,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&iptr,(const PetscInt**)&jptr,&done));
3462c71b3e2SJacob Faibussowitsch     PetscCheckFalse(nr != dr,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT,nr,dr);
3472c71b3e2SJacob Faibussowitsch     PetscCheckFalse(iptr[nr] < nnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in local mat! reuse %" PetscInt_FMT " requested %" PetscInt_FMT,iptr[nr],nnz);
3489566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(lA,&data));
3492df22349SStefano Zampini   }
3502df22349SStefano Zampini   /* merge local matrices */
3512df22349SStefano Zampini   ii  = iptr;
3522df22349SStefano Zampini   jj  = jptr;
35339accc25SStefano Zampini   aa  = (HYPRE_Complex*)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */
3542df22349SStefano Zampini   *ii = *(hdi++) + *(hoi++);
3552df22349SStefano Zampini   for (jd=0,jo=0,cum=0; *ii<nnz; cum++) {
35639accc25SStefano Zampini     PetscScalar *aold = (PetscScalar*)aa;
3572df22349SStefano Zampini     PetscInt    *jold = jj,nc = jd+jo;
3582df22349SStefano Zampini     for (; jd<*hdi; jd++) { *jj++ = *hdj++;      *aa++ = *hdd++; }
3592df22349SStefano Zampini     for (; jo<*hoi; jo++) { *jj++ = *hoj++ + dc; *aa++ = *hod++; }
3602df22349SStefano Zampini     *(++ii) = *(hdi++) + *(hoi++);
3619566063dSJacob Faibussowitsch     PetscCall(PetscSortIntWithScalarArray(jd+jo-nc,jold,aold));
3622df22349SStefano Zampini   }
3632df22349SStefano Zampini   for (; cum<dr; cum++) *(++ii) = nnz;
3642df22349SStefano Zampini   if (reuse != MAT_REUSE_MATRIX) {
365a033916dSStefano Zampini     Mat_SeqAIJ* a;
366a033916dSStefano Zampini 
3679566063dSJacob Faibussowitsch     PetscCall(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,dr,dc+oc,iptr,jptr,data,&lA));
3689566063dSJacob Faibussowitsch     PetscCall(MatISSetLocalMat(*B,lA));
369a033916dSStefano Zampini     /* hack SeqAIJ */
370a033916dSStefano Zampini     a          = (Mat_SeqAIJ*)(lA->data);
371a033916dSStefano Zampini     a->free_a  = PETSC_TRUE;
372a033916dSStefano Zampini     a->free_ij = PETSC_TRUE;
3739566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&lA));
3742df22349SStefano Zampini   }
3759566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY));
3769566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY));
3772df22349SStefano Zampini   if (reuse == MAT_INPLACE_MATRIX) {
3789566063dSJacob Faibussowitsch     PetscCall(MatHeaderReplace(A,B));
3792df22349SStefano Zampini   }
3802df22349SStefano Zampini   PetscFunctionReturn(0);
3812df22349SStefano Zampini }
3822df22349SStefano Zampini 
38363c07aadSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B)
38463c07aadSStefano Zampini {
38584d4e069SStefano Zampini   Mat            M = NULL;
38663c07aadSStefano Zampini   Mat_HYPRE      *hB;
38763c07aadSStefano Zampini   MPI_Comm       comm = PetscObjectComm((PetscObject)A);
38863c07aadSStefano Zampini 
38963c07aadSStefano Zampini   PetscFunctionBegin;
39063c07aadSStefano Zampini   if (reuse == MAT_REUSE_MATRIX) {
39163c07aadSStefano Zampini     /* always destroy the old matrix and create a new memory;
39263c07aadSStefano Zampini        hope this does not churn the memory too much. The problem
39363c07aadSStefano Zampini        is I do not know if it is possible to put the matrix back to
39463c07aadSStefano Zampini        its initial state so that we can directly copy the values
39563c07aadSStefano Zampini        the second time through. */
39663c07aadSStefano Zampini     hB = (Mat_HYPRE*)((*B)->data);
397a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixDestroy,hB->ij);
39863c07aadSStefano Zampini   } else {
3999566063dSJacob Faibussowitsch     PetscCall(MatCreate(comm,&M));
4009566063dSJacob Faibussowitsch     PetscCall(MatSetType(M,MATHYPRE));
4019566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(M,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N));
40284d4e069SStefano Zampini     hB   = (Mat_HYPRE*)(M->data);
40384d4e069SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) *B = M;
40463c07aadSStefano Zampini   }
4059566063dSJacob Faibussowitsch   PetscCall(MatSetOption(*B,MAT_SORTED_FULL,PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */
4069566063dSJacob Faibussowitsch   PetscCall(MatSetOption(*B,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE));
4079566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_CreateFromMat(A,hB));
4089566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_IJMatrixCopy(A,hB->ij));
40984d4e069SStefano Zampini   if (reuse == MAT_INPLACE_MATRIX) {
4109566063dSJacob Faibussowitsch     PetscCall(MatHeaderReplace(A,&M));
41184d4e069SStefano Zampini   }
4124ec6421dSstefano_zampini   (*B)->preallocated = PETSC_TRUE;
4139566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY));
4149566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY));
41563c07aadSStefano Zampini   PetscFunctionReturn(0);
41663c07aadSStefano Zampini }
41763c07aadSStefano Zampini 
418ea9daf28SStefano Zampini static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B)
41963c07aadSStefano Zampini {
42063c07aadSStefano Zampini   Mat_HYPRE          *hA = (Mat_HYPRE*)A->data;
42163c07aadSStefano Zampini   hypre_ParCSRMatrix *parcsr;
42263c07aadSStefano Zampini   hypre_CSRMatrix    *hdiag,*hoffd;
42363c07aadSStefano Zampini   MPI_Comm           comm;
42463c07aadSStefano Zampini   PetscScalar        *da,*oa,*aptr;
42563c07aadSStefano Zampini   PetscInt           *dii,*djj,*oii,*ojj,*iptr;
42663c07aadSStefano Zampini   PetscInt           i,dnnz,onnz,m,n;
42758968eb6SStefano Zampini   HYPRE_Int          type;
42863c07aadSStefano Zampini   PetscMPIInt        size;
4292cf14000SStefano Zampini   PetscBool          sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
43063c07aadSStefano Zampini 
43163c07aadSStefano Zampini   PetscFunctionBegin;
43263c07aadSStefano Zampini   comm = PetscObjectComm((PetscObject)A);
433a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hA->ij,&type);
4342c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
43563c07aadSStefano Zampini   if (reuse == MAT_REUSE_MATRIX) {
43663c07aadSStefano Zampini     PetscBool ismpiaij,isseqaij;
4379566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B,MATMPIAIJ,&ismpiaij));
4389566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B,MATSEQAIJ,&isseqaij));
4392c71b3e2SJacob Faibussowitsch     PetscCheckFalse(!ismpiaij && !isseqaij,comm,PETSC_ERR_SUP,"Only MATMPIAIJ or MATSEQAIJ are supported");
44063c07aadSStefano Zampini   }
4416ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
4422c71b3e2SJacob Faibussowitsch   PetscCheckFalse(HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij),comm,PETSC_ERR_SUP,"Not yet implemented");
4436ea7df73SStefano Zampini #endif
4449566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(comm,&size));
44563c07aadSStefano Zampini 
446a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr);
44763c07aadSStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(parcsr);
44863c07aadSStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(parcsr);
44963c07aadSStefano Zampini   m     = hypre_CSRMatrixNumRows(hdiag);
45063c07aadSStefano Zampini   n     = hypre_CSRMatrixNumCols(hdiag);
45163c07aadSStefano Zampini   dnnz  = hypre_CSRMatrixNumNonzeros(hdiag);
45263c07aadSStefano Zampini   onnz  = hypre_CSRMatrixNumNonzeros(hoffd);
453225daaf8SStefano Zampini   if (reuse == MAT_INITIAL_MATRIX) {
4549566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m+1,&dii));
4559566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dnnz,&djj));
4569566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dnnz,&da));
457225daaf8SStefano Zampini   } else if (reuse == MAT_REUSE_MATRIX) {
45863c07aadSStefano Zampini     PetscInt  nr;
45963c07aadSStefano Zampini     PetscBool done;
46063c07aadSStefano Zampini     if (size > 1) {
46163c07aadSStefano Zampini       Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data);
46263c07aadSStefano Zampini 
4639566063dSJacob Faibussowitsch       PetscCall(MatGetRowIJ(b->A,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&dii,(const PetscInt**)&djj,&done));
4642c71b3e2SJacob Faibussowitsch       PetscCheckFalse(nr != m,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows in diag part! %" PetscInt_FMT " != %" PetscInt_FMT,nr,m);
4652c71b3e2SJacob Faibussowitsch       PetscCheckFalse(dii[nr] < dnnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in diag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,dii[nr],dnnz);
4669566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(b->A,&da));
46763c07aadSStefano Zampini     } else {
4689566063dSJacob Faibussowitsch       PetscCall(MatGetRowIJ(*B,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&dii,(const PetscInt**)&djj,&done));
4692c71b3e2SJacob Faibussowitsch       PetscCheckFalse(nr != m,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows! %" PetscInt_FMT " != %" PetscInt_FMT,nr,m);
4702c71b3e2SJacob Faibussowitsch       PetscCheckFalse(dii[nr] < dnnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,dii[nr],dnnz);
4719566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(*B,&da));
47263c07aadSStefano Zampini     }
473225daaf8SStefano Zampini   } else { /* MAT_INPLACE_MATRIX */
4742cf14000SStefano Zampini     if (!sameint) {
4759566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m+1,&dii));
4769566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(dnnz,&djj));
4772cf14000SStefano Zampini     } else {
4787d968826Sstefano_zampini       dii = (PetscInt*)hypre_CSRMatrixI(hdiag);
4797d968826Sstefano_zampini       djj = (PetscInt*)hypre_CSRMatrixJ(hdiag);
48063c07aadSStefano Zampini     }
48139accc25SStefano Zampini     da = (PetscScalar*)hypre_CSRMatrixData(hdiag);
48263c07aadSStefano Zampini   }
4832cf14000SStefano Zampini 
4842cf14000SStefano Zampini   if (!sameint) {
485a16187a7SStefano Zampini     if (reuse != MAT_REUSE_MATRIX) { for (i=0;i<m+1;i++)  dii[i] = (PetscInt)(hypre_CSRMatrixI(hdiag)[i]); }
4862cf14000SStefano Zampini     for (i=0;i<dnnz;i++) djj[i] = (PetscInt)(hypre_CSRMatrixJ(hdiag)[i]);
4872cf14000SStefano Zampini   } else {
4889566063dSJacob Faibussowitsch     if (reuse != MAT_REUSE_MATRIX) PetscCall(PetscArraycpy(dii,hypre_CSRMatrixI(hdiag),m+1));
4899566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(djj,hypre_CSRMatrixJ(hdiag),dnnz));
4902cf14000SStefano Zampini   }
4919566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(da,hypre_CSRMatrixData(hdiag),dnnz));
49263c07aadSStefano Zampini   iptr = djj;
49363c07aadSStefano Zampini   aptr = da;
49463c07aadSStefano Zampini   for (i=0; i<m; i++) {
49563c07aadSStefano Zampini     PetscInt nc = dii[i+1]-dii[i];
4969566063dSJacob Faibussowitsch     PetscCall(PetscSortIntWithScalarArray(nc,iptr,aptr));
49763c07aadSStefano Zampini     iptr += nc;
49863c07aadSStefano Zampini     aptr += nc;
49963c07aadSStefano Zampini   }
50063c07aadSStefano Zampini   if (size > 1) {
5012cf14000SStefano Zampini     HYPRE_BigInt *coffd;
5022cf14000SStefano Zampini     HYPRE_Int    *offdj;
50363c07aadSStefano Zampini 
504225daaf8SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) {
5059566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m+1,&oii));
5069566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(onnz,&ojj));
5079566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(onnz,&oa));
508225daaf8SStefano Zampini     } else if (reuse == MAT_REUSE_MATRIX) {
50963c07aadSStefano Zampini       Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data);
51063c07aadSStefano Zampini       PetscInt   nr,hr = hypre_CSRMatrixNumRows(hoffd);
51163c07aadSStefano Zampini       PetscBool  done;
51263c07aadSStefano Zampini 
5139566063dSJacob Faibussowitsch       PetscCall(MatGetRowIJ(b->B,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&oii,(const PetscInt**)&ojj,&done));
5142c71b3e2SJacob Faibussowitsch       PetscCheckFalse(nr != hr,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows in offdiag part! %" PetscInt_FMT " != %" PetscInt_FMT,nr,hr);
5152c71b3e2SJacob Faibussowitsch       PetscCheckFalse(oii[nr] < onnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in offdiag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,oii[nr],onnz);
5169566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(b->B,&oa));
517225daaf8SStefano Zampini     } else { /* MAT_INPLACE_MATRIX */
5182cf14000SStefano Zampini       if (!sameint) {
5199566063dSJacob Faibussowitsch         PetscCall(PetscMalloc1(m+1,&oii));
5209566063dSJacob Faibussowitsch         PetscCall(PetscMalloc1(onnz,&ojj));
5212cf14000SStefano Zampini       } else {
5227d968826Sstefano_zampini         oii = (PetscInt*)hypre_CSRMatrixI(hoffd);
5237d968826Sstefano_zampini         ojj = (PetscInt*)hypre_CSRMatrixJ(hoffd);
52463c07aadSStefano Zampini       }
52539accc25SStefano Zampini       oa = (PetscScalar*)hypre_CSRMatrixData(hoffd);
52663c07aadSStefano Zampini     }
527a16187a7SStefano Zampini     if (reuse != MAT_REUSE_MATRIX) {
5282cf14000SStefano Zampini       if (!sameint) {
5292cf14000SStefano Zampini         for (i=0;i<m+1;i++) oii[i] = (PetscInt)(hypre_CSRMatrixI(hoffd)[i]);
5302cf14000SStefano Zampini       } else {
5319566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(oii,hypre_CSRMatrixI(hoffd),m+1));
5322cf14000SStefano Zampini       }
533a16187a7SStefano Zampini     }
5349566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(oa,hypre_CSRMatrixData(hoffd),onnz));
535a16187a7SStefano Zampini 
53663c07aadSStefano Zampini     offdj = hypre_CSRMatrixJ(hoffd);
53763c07aadSStefano Zampini     coffd = hypre_ParCSRMatrixColMapOffd(parcsr);
538a16187a7SStefano Zampini     /* we only need the permutation to be computed properly, I don't know if HYPRE
539a16187a7SStefano Zampini        messes up with the ordering. Just in case, allocate some memory and free it
540a16187a7SStefano Zampini        later */
541a16187a7SStefano Zampini     if (reuse == MAT_REUSE_MATRIX) {
542a16187a7SStefano Zampini       Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data);
543a16187a7SStefano Zampini       PetscInt   mnz;
544a16187a7SStefano Zampini 
5459566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetMaxRowNonzeros(b->B,&mnz));
5469566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(mnz,&ojj));
547a16187a7SStefano Zampini     } else for (i=0; i<onnz; i++) ojj[i] = coffd[offdj[i]];
54863c07aadSStefano Zampini     iptr = ojj;
54963c07aadSStefano Zampini     aptr = oa;
55063c07aadSStefano Zampini     for (i=0; i<m; i++) {
55163c07aadSStefano Zampini        PetscInt nc = oii[i+1]-oii[i];
552a16187a7SStefano Zampini        if (reuse == MAT_REUSE_MATRIX) {
553a16187a7SStefano Zampini          PetscInt j;
554a16187a7SStefano Zampini 
555a16187a7SStefano Zampini          iptr = ojj;
556a16187a7SStefano Zampini          for (j=0; j<nc; j++) iptr[j] = coffd[offdj[oii[i] + j]];
557a16187a7SStefano Zampini        }
5589566063dSJacob Faibussowitsch        PetscCall(PetscSortIntWithScalarArray(nc,iptr,aptr));
55963c07aadSStefano Zampini        iptr += nc;
56063c07aadSStefano Zampini        aptr += nc;
56163c07aadSStefano Zampini     }
5629566063dSJacob Faibussowitsch     if (reuse == MAT_REUSE_MATRIX) PetscCall(PetscFree(ojj));
563225daaf8SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) {
56463c07aadSStefano Zampini       Mat_MPIAIJ *b;
56563c07aadSStefano Zampini       Mat_SeqAIJ *d,*o;
566225daaf8SStefano Zampini 
5679566063dSJacob Faibussowitsch       PetscCall(MatCreateMPIAIJWithSplitArrays(comm,m,n,PETSC_DECIDE,PETSC_DECIDE,dii,djj,da,oii,ojj,oa,B));
56863c07aadSStefano Zampini       /* hack MPIAIJ */
56963c07aadSStefano Zampini       b          = (Mat_MPIAIJ*)((*B)->data);
57063c07aadSStefano Zampini       d          = (Mat_SeqAIJ*)b->A->data;
57163c07aadSStefano Zampini       o          = (Mat_SeqAIJ*)b->B->data;
57263c07aadSStefano Zampini       d->free_a  = PETSC_TRUE;
57363c07aadSStefano Zampini       d->free_ij = PETSC_TRUE;
57463c07aadSStefano Zampini       o->free_a  = PETSC_TRUE;
57563c07aadSStefano Zampini       o->free_ij = PETSC_TRUE;
576225daaf8SStefano Zampini     } else if (reuse == MAT_INPLACE_MATRIX) {
577225daaf8SStefano Zampini       Mat T;
5782cf14000SStefano Zampini 
5799566063dSJacob Faibussowitsch       PetscCall(MatCreateMPIAIJWithSplitArrays(comm,m,n,PETSC_DECIDE,PETSC_DECIDE,dii,djj,da,oii,ojj,oa,&T));
5802cf14000SStefano Zampini       if (sameint) { /* ownership of CSR pointers is transferred to PETSc */
581225daaf8SStefano Zampini         hypre_CSRMatrixI(hdiag) = NULL;
582225daaf8SStefano Zampini         hypre_CSRMatrixJ(hdiag) = NULL;
583225daaf8SStefano Zampini         hypre_CSRMatrixI(hoffd) = NULL;
584225daaf8SStefano Zampini         hypre_CSRMatrixJ(hoffd) = NULL;
5852cf14000SStefano Zampini       } else { /* Hack MPIAIJ -> free ij but not a */
5862cf14000SStefano Zampini         Mat_MPIAIJ *b = (Mat_MPIAIJ*)(T->data);
5872cf14000SStefano Zampini         Mat_SeqAIJ *d = (Mat_SeqAIJ*)(b->A->data);
5882cf14000SStefano Zampini         Mat_SeqAIJ *o = (Mat_SeqAIJ*)(b->B->data);
5892cf14000SStefano Zampini 
5902cf14000SStefano Zampini         d->free_ij = PETSC_TRUE;
5912cf14000SStefano Zampini         o->free_ij = PETSC_TRUE;
5922cf14000SStefano Zampini       }
5932cf14000SStefano Zampini       hypre_CSRMatrixData(hdiag) = NULL;
594225daaf8SStefano Zampini       hypre_CSRMatrixData(hoffd) = NULL;
5959566063dSJacob Faibussowitsch       PetscCall(MatHeaderReplace(A,&T));
59663c07aadSStefano Zampini     }
597225daaf8SStefano Zampini   } else {
598225daaf8SStefano Zampini     oii  = NULL;
599225daaf8SStefano Zampini     ojj  = NULL;
600225daaf8SStefano Zampini     oa   = NULL;
601225daaf8SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) {
60263c07aadSStefano Zampini       Mat_SeqAIJ* b;
6032cf14000SStefano Zampini 
6049566063dSJacob Faibussowitsch       PetscCall(MatCreateSeqAIJWithArrays(comm,m,n,dii,djj,da,B));
60563c07aadSStefano Zampini       /* hack SeqAIJ */
60663c07aadSStefano Zampini       b          = (Mat_SeqAIJ*)((*B)->data);
60763c07aadSStefano Zampini       b->free_a  = PETSC_TRUE;
60863c07aadSStefano Zampini       b->free_ij = PETSC_TRUE;
609225daaf8SStefano Zampini     } else if (reuse == MAT_INPLACE_MATRIX) {
610225daaf8SStefano Zampini       Mat T;
6112cf14000SStefano Zampini 
6129566063dSJacob Faibussowitsch       PetscCall(MatCreateSeqAIJWithArrays(comm,m,n,dii,djj,da,&T));
6132cf14000SStefano Zampini       if (sameint) { /* ownership of CSR pointers is transferred to PETSc */
614225daaf8SStefano Zampini         hypre_CSRMatrixI(hdiag) = NULL;
615225daaf8SStefano Zampini         hypre_CSRMatrixJ(hdiag) = NULL;
6162cf14000SStefano Zampini       } else { /* free ij but not a */
6172cf14000SStefano Zampini         Mat_SeqAIJ* b = (Mat_SeqAIJ*)(T->data);
6182cf14000SStefano Zampini 
6192cf14000SStefano Zampini         b->free_ij = PETSC_TRUE;
6202cf14000SStefano Zampini       }
621225daaf8SStefano Zampini       hypre_CSRMatrixData(hdiag) = NULL;
6229566063dSJacob Faibussowitsch       PetscCall(MatHeaderReplace(A,&T));
62363c07aadSStefano Zampini     }
624225daaf8SStefano Zampini   }
625225daaf8SStefano Zampini 
6262cf14000SStefano Zampini   /* we have to use hypre_TFree to free the HYPRE arrays
6272cf14000SStefano Zampini      that PETSc now owns */
62863c07aadSStefano Zampini   if (reuse == MAT_INPLACE_MATRIX) {
6292cf14000SStefano Zampini     PetscInt nh;
6302cf14000SStefano Zampini     void *ptrs[6] = {da,oa,dii,djj,oii,ojj};
6312cf14000SStefano Zampini     const char *names[6] = {"_hypre_csr_da",
6322cf14000SStefano Zampini                             "_hypre_csr_oa",
6332cf14000SStefano Zampini                             "_hypre_csr_dii",
634225daaf8SStefano Zampini                             "_hypre_csr_djj",
635225daaf8SStefano Zampini                             "_hypre_csr_oii",
6362cf14000SStefano Zampini                             "_hypre_csr_ojj"};
6372cf14000SStefano Zampini     nh = sameint ? 6 : 2;
6382cf14000SStefano Zampini     for (i=0; i<nh; i++) {
639225daaf8SStefano Zampini       PetscContainer c;
640225daaf8SStefano Zampini 
6419566063dSJacob Faibussowitsch       PetscCall(PetscContainerCreate(comm,&c));
6429566063dSJacob Faibussowitsch       PetscCall(PetscContainerSetPointer(c,ptrs[i]));
6439566063dSJacob Faibussowitsch       PetscCall(PetscContainerSetUserDestroy(c,hypre_array_destroy));
6449566063dSJacob Faibussowitsch       PetscCall(PetscObjectCompose((PetscObject)(*B),names[i],(PetscObject)c));
6459566063dSJacob Faibussowitsch       PetscCall(PetscContainerDestroy(&c));
646225daaf8SStefano Zampini     }
64763c07aadSStefano Zampini   }
64863c07aadSStefano Zampini   PetscFunctionReturn(0);
64963c07aadSStefano Zampini }
65063c07aadSStefano Zampini 
/*
   MatAIJGetParCSR_Private - Wraps the CSR data of an AIJ matrix in a temporary
   hypre_ParCSRMatrix without copying the numerical values.

   Input:
     A  - matrix whose base type is MATMPIAIJ or MATSEQAIJ (anything else raises PETSC_ERR_SUP)
   Output:
     hA - the newly created ParCSR wrapper

   The wrapper borrows A's value arrays (diag->a, offd->a), uses a->garray as its
   off-diagonal column map and takes its row/column starts from A's layout ranges.
   The row/column index arrays are either borrowed as well or, when sameint is false,
   converted copies allocated here with PetscMalloc2(); those copies are released in
   MatAIJRestoreParCSR_Private().
*/
651613e5ff0Sstefano_zampini static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA)
652c1a070e6SStefano Zampini {
653613e5ff0Sstefano_zampini   hypre_ParCSRMatrix *tA;
654c1a070e6SStefano Zampini   hypre_CSRMatrix    *hdiag,*hoffd;
655c1a070e6SStefano Zampini   Mat_SeqAIJ         *diag,*offd;
6562cf14000SStefano Zampini   PetscInt           *garray,i,noffd,dnnz,onnz,*row_starts,*col_starts;
657c1a070e6SStefano Zampini   MPI_Comm           comm = PetscObjectComm((PetscObject)A);
658613e5ff0Sstefano_zampini   PetscBool          ismpiaij,isseqaij;
  /* sameint: PETSc index arrays can be handed to hypre as-is (no conversion copy needed) */
6592cf14000SStefano Zampini   PetscBool          sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
  /* h*: index arrays given to hypre; p*: index arrays stored in the Mat_SeqAIJ structs */
6606ea7df73SStefano Zampini   HYPRE_Int          *hdi = NULL,*hdj = NULL,*hoi = NULL,*hoj = NULL;
6615c97c10fSStefano Zampini   PetscInt           *pdi = NULL,*pdj = NULL,*poi = NULL,*poj = NULL;
6626ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
6636ea7df73SStefano Zampini   PetscBool          iscuda = PETSC_FALSE;
6646ea7df73SStefano Zampini #endif
665c1a070e6SStefano Zampini 
666c1a070e6SStefano Zampini   PetscFunctionBegin;
6679566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&ismpiaij));
6689566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&isseqaij));
6692c71b3e2SJacob Faibussowitsch   PetscCheckFalse(!ismpiaij && !isseqaij,comm,PETSC_ERR_SUP,"Unsupported type %s",((PetscObject)A)->type_name);
670c1a070e6SStefano Zampini   if (ismpiaij) {
671c1a070e6SStefano Zampini     Mat_MPIAIJ *a = (Mat_MPIAIJ*)(A->data);
672c1a070e6SStefano Zampini 
673c1a070e6SStefano Zampini     diag = (Mat_SeqAIJ*)a->A->data;
674c1a070e6SStefano Zampini     offd = (Mat_SeqAIJ*)a->B->data;
    /* CUSPARSE matrix not bound to the CPU: take the index arrays returned by
       MatSeqAIJCUSPARSEGetIJ() (presumably device pointers - TODO confirm) and force
       sameint so that no conversion copy is made below.
       NOTE(review): this guard also requires HYPRE_USING_CUDA, the sequential branch
       further down does not - confirm the asymmetry is intended */
6756ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) && defined(HYPRE_USING_CUDA)
6769566063dSJacob Faibussowitsch     PetscCall(PetscObjectTypeCompare((PetscObject)A,MATMPIAIJCUSPARSE,&iscuda));
6776ea7df73SStefano Zampini     if (iscuda && !A->boundtocpu) {
6786ea7df73SStefano Zampini       sameint = PETSC_TRUE;
6799566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJCUSPARSEGetIJ(a->A,PETSC_FALSE,(const HYPRE_Int**)&hdi,(const HYPRE_Int**)&hdj));
6809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJCUSPARSEGetIJ(a->B,PETSC_FALSE,(const HYPRE_Int**)&hoi,(const HYPRE_Int**)&hoj));
6816ea7df73SStefano Zampini     } else {
6826ea7df73SStefano Zampini #else
6836ea7df73SStefano Zampini     {
6846ea7df73SStefano Zampini #endif
      /* use the index arrays stored in the Mat_SeqAIJ structs; they are aliased as
         HYPRE_Int only when the integer sizes match */
6856ea7df73SStefano Zampini       pdi = diag->i;
6866ea7df73SStefano Zampini       pdj = diag->j;
6876ea7df73SStefano Zampini       poi = offd->i;
6886ea7df73SStefano Zampini       poj = offd->j;
6896ea7df73SStefano Zampini       if (sameint) {
6906ea7df73SStefano Zampini         hdi = (HYPRE_Int*)pdi;
6916ea7df73SStefano Zampini         hdj = (HYPRE_Int*)pdj;
6926ea7df73SStefano Zampini         hoi = (HYPRE_Int*)poi;
6936ea7df73SStefano Zampini         hoj = (HYPRE_Int*)poj;
6946ea7df73SStefano Zampini       }
6956ea7df73SStefano Zampini     }
696c1a070e6SStefano Zampini     garray = a->garray;
697c1a070e6SStefano Zampini     noffd  = a->B->cmap->N;
698c1a070e6SStefano Zampini     dnnz   = diag->nz;
699c1a070e6SStefano Zampini     onnz   = offd->nz;
700c1a070e6SStefano Zampini   } else {
    /* sequential matrix: there is no off-diagonal block and no column map */
701c1a070e6SStefano Zampini     diag = (Mat_SeqAIJ*)A->data;
702c1a070e6SStefano Zampini     offd = NULL;
7036ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE)
7049566063dSJacob Faibussowitsch     PetscCall(PetscObjectTypeCompare((PetscObject)A,MATSEQAIJCUSPARSE,&iscuda));
7056ea7df73SStefano Zampini     if (iscuda && !A->boundtocpu) {
7066ea7df73SStefano Zampini       sameint = PETSC_TRUE;
7079566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJCUSPARSEGetIJ(A,PETSC_FALSE,(const HYPRE_Int**)&hdi,(const HYPRE_Int**)&hdj));
7086ea7df73SStefano Zampini     } else {
7096ea7df73SStefano Zampini #else
7106ea7df73SStefano Zampini     {
7116ea7df73SStefano Zampini #endif
7126ea7df73SStefano Zampini       pdi = diag->i;
7136ea7df73SStefano Zampini       pdj = diag->j;
7146ea7df73SStefano Zampini       if (sameint) {
7156ea7df73SStefano Zampini         hdi = (HYPRE_Int*)pdi;
7166ea7df73SStefano Zampini         hdj = (HYPRE_Int*)pdj;
7176ea7df73SStefano Zampini       }
7186ea7df73SStefano Zampini     }
719c1a070e6SStefano Zampini     garray = NULL;
720c1a070e6SStefano Zampini     noffd  = 0;
721c1a070e6SStefano Zampini     dnnz   = diag->nz;
722c1a070e6SStefano Zampini     onnz   = 0;
723c1a070e6SStefano Zampini   }
724225daaf8SStefano Zampini 
725c1a070e6SStefano Zampini   /* create a temporary ParCSR */
  /* when HYPRE_AssumedPartitionCheck() is true the starts pointers are offset by this
     rank into A's range arrays, otherwise the range arrays are passed from their beginning */
726c1a070e6SStefano Zampini   if (HYPRE_AssumedPartitionCheck()) {
727c1a070e6SStefano Zampini     PetscMPIInt myid;
728c1a070e6SStefano Zampini 
7299566063dSJacob Faibussowitsch     PetscCallMPI(MPI_Comm_rank(comm,&myid));
730c1a070e6SStefano Zampini     row_starts = A->rmap->range + myid;
731c1a070e6SStefano Zampini     col_starts = A->cmap->range + myid;
732c1a070e6SStefano Zampini   } else {
733c1a070e6SStefano Zampini     row_starts = A->rmap->range;
734c1a070e6SStefano Zampini     col_starts = A->cmap->range;
735c1a070e6SStefano Zampini   }
  /* the PetscInt arrays are reinterpreted as HYPRE_BigInt by the casts below
     (assumes both types have the same size - TODO confirm) */
7362cf14000SStefano Zampini   tA = hypre_ParCSRMatrixCreate(comm,A->rmap->N,A->cmap->N,(HYPRE_BigInt*)row_starts,(HYPRE_BigInt*)col_starts,noffd,dnnz,onnz);
  /* the starts arrays belong to A's layouts: mark tA as not owning them */
737a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
738c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetRowStartsOwner(tA,0);
739c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetColStartsOwner(tA,0);
740a1d2239cSSatish Balay #endif
741c1a070e6SStefano Zampini 
742225daaf8SStefano Zampini   /* set diagonal part */
743c1a070e6SStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(tA);
7446ea7df73SStefano Zampini   if (!sameint) { /* malloc CSR pointers */
7459566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(A->rmap->n+1,&hdi,dnnz,&hdj));
7466ea7df73SStefano Zampini     for (i = 0; i < A->rmap->n+1; i++) hdi[i] = (HYPRE_Int)(pdi[i]);
7476ea7df73SStefano Zampini     for (i = 0; i < dnnz; i++)         hdj[i] = (HYPRE_Int)(pdj[i]);
7482cf14000SStefano Zampini   }
7496ea7df73SStefano Zampini   hypre_CSRMatrixI(hdiag)           = hdi;
7506ea7df73SStefano Zampini   hypre_CSRMatrixJ(hdiag)           = hdj;
  /* values are borrowed from A, hence the data-owner flag is cleared below */
75139accc25SStefano Zampini   hypre_CSRMatrixData(hdiag)        = (HYPRE_Complex*)diag->a;
752c1a070e6SStefano Zampini   hypre_CSRMatrixNumNonzeros(hdiag) = diag->nz;
753c1a070e6SStefano Zampini   hypre_CSRMatrixSetRownnz(hdiag);
754c1a070e6SStefano Zampini   hypre_CSRMatrixSetDataOwner(hdiag,0);
755c1a070e6SStefano Zampini 
756225daaf8SStefano Zampini   /* set offdiagonal part */
757c1a070e6SStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(tA);
  /* offd is NULL for a sequential A, in which case hoffd is left as created */
758c1a070e6SStefano Zampini   if (offd) {
7596ea7df73SStefano Zampini     if (!sameint) { /* malloc CSR pointers */
7609566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(A->rmap->n+1,&hoi,onnz,&hoj));
7616ea7df73SStefano Zampini       for (i = 0; i < A->rmap->n+1; i++) hoi[i] = (HYPRE_Int)(poi[i]);
7626ea7df73SStefano Zampini       for (i = 0; i < onnz; i++)         hoj[i] = (HYPRE_Int)(poj[i]);
7632cf14000SStefano Zampini     }
7646ea7df73SStefano Zampini     hypre_CSRMatrixI(hoffd)           = hoi;
7656ea7df73SStefano Zampini     hypre_CSRMatrixJ(hoffd)           = hoj;
76639accc25SStefano Zampini     hypre_CSRMatrixData(hoffd)        = (HYPRE_Complex*)offd->a;
767c1a070e6SStefano Zampini     hypre_CSRMatrixNumNonzeros(hoffd) = offd->nz;
768c1a070e6SStefano Zampini     hypre_CSRMatrixSetRownnz(hoffd);
769c1a070e6SStefano Zampini     hypre_CSRMatrixSetDataOwner(hoffd,0);
7706ea7df73SStefano Zampini   }
  /* NOTE(review): the memory location is selected from iscuda alone, while the index
     arrays set above are the Mat_SeqAIJ ones whenever A->boundtocpu is true - confirm
     this combination is handled as intended */
7716ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
772a74df02fSJacob Faibussowitsch   PetscStackCallStandard(hypre_ParCSRMatrixInitialize_v2,tA,iscuda ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST);
7736ea7df73SStefano Zampini #else
7746ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0)
775a74df02fSJacob Faibussowitsch   PetscStackCallStandard(hypre_ParCSRMatrixInitialize,tA);
7766ea7df73SStefano Zampini #else
777a74df02fSJacob Faibussowitsch   PetscStackCallStandard(hypre_ParCSRMatrixInitialize_v2,tA,HYPRE_MEMORY_HOST);
7786ea7df73SStefano Zampini #endif
7796ea7df73SStefano Zampini #endif
  /* release the column map tA holds at this point (presumably allocated by the
     Initialize call above - TODO confirm) and substitute A's garray for it */
7806ea7df73SStefano Zampini   hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA),HYPRE_MEMORY_HOST);
781c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetNumNonzeros(tA);
7822cf14000SStefano Zampini   hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt*)garray;
  /* create the matvec communication package only if tA does not have one yet */
783a74df02fSJacob Faibussowitsch   if (!hypre_ParCSRMatrixCommPkg(tA)) PetscStackCallStandard(hypre_MatvecCommPkgCreate,tA);
784613e5ff0Sstefano_zampini   *hA = tA;
785613e5ff0Sstefano_zampini   PetscFunctionReturn(0);
786613e5ff0Sstefano_zampini }
787c1a070e6SStefano Zampini 
/*
   MatAIJRestoreParCSR_Private - Disposes of a hypre_ParCSRMatrix wrapper built around
   the AIJ matrix A.

   Input:
     A  - the AIJ matrix the wrapper refers to
   Input/Output:
     hA - the wrapper; set to NULL on return

   When sameint is false the I/J arrays of the diagonal block (and of the off-diagonal
   block for MATMPIAIJ) are released with PetscFree2(). All I/J/data pointers and the
   off-diagonal column map are then set to NULL before hypre_ParCSRMatrixDestroy() is
   called on the wrapper.
*/
788613e5ff0Sstefano_zampini static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA)
789613e5ff0Sstefano_zampini {
790613e5ff0Sstefano_zampini   hypre_CSRMatrix *hdiag,*hoffd;
7916ea7df73SStefano Zampini   PetscBool       ismpiaij,sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
7926ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
7936ea7df73SStefano Zampini   PetscBool       iscuda = PETSC_FALSE;
7946ea7df73SStefano Zampini #endif
795c1a070e6SStefano Zampini 
796613e5ff0Sstefano_zampini   PetscFunctionBegin;
7979566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&ismpiaij));
  /* NOTE(review): sameint is forced for every CUSPARSE type here, whereas
     MatAIJGetParCSR_Private() forces it only when !A->boundtocpu; if the integer sizes
     differ and A is bound to the CPU, the arrays allocated there with PetscMalloc2()
     would not be freed below - verify */
7986ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
7999566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompareAny((PetscObject)A,&iscuda,MATSEQAIJCUSPARSE,MATMPIAIJCUSPARSE,""));
8006ea7df73SStefano Zampini   if (iscuda) sameint = PETSC_TRUE;
8016ea7df73SStefano Zampini #endif
802613e5ff0Sstefano_zampini   hdiag = hypre_ParCSRMatrixDiag(*hA);
803613e5ff0Sstefano_zampini   hoffd = hypre_ParCSRMatrixOffd(*hA);
8046ea7df73SStefano Zampini   /* free temporary memory allocated by PETSc
8056ea7df73SStefano Zampini      set pointers to NULL before destroying tA */
8062cf14000SStefano Zampini   if (!sameint) {
8072cf14000SStefano Zampini     HYPRE_Int *hi,*hj;
8082cf14000SStefano Zampini 
    /* the I and J arrays are freed as a pair with PetscFree2() */
8092cf14000SStefano Zampini     hi = hypre_CSRMatrixI(hdiag);
8102cf14000SStefano Zampini     hj = hypre_CSRMatrixJ(hdiag);
8119566063dSJacob Faibussowitsch     PetscCall(PetscFree2(hi,hj));
8126ea7df73SStefano Zampini     if (ismpiaij) {
8132cf14000SStefano Zampini       hi = hypre_CSRMatrixI(hoffd);
8142cf14000SStefano Zampini       hj = hypre_CSRMatrixJ(hoffd);
8159566063dSJacob Faibussowitsch       PetscCall(PetscFree2(hi,hj));
8162cf14000SStefano Zampini     }
8172cf14000SStefano Zampini   }
  /* detach every array from the wrapper before it is destroyed */
818c1a070e6SStefano Zampini   hypre_CSRMatrixI(hdiag)    = NULL;
819c1a070e6SStefano Zampini   hypre_CSRMatrixJ(hdiag)    = NULL;
820c1a070e6SStefano Zampini   hypre_CSRMatrixData(hdiag) = NULL;
8216ea7df73SStefano Zampini   if (ismpiaij) {
822c1a070e6SStefano Zampini     hypre_CSRMatrixI(hoffd)    = NULL;
823c1a070e6SStefano Zampini     hypre_CSRMatrixJ(hoffd)    = NULL;
824c1a070e6SStefano Zampini     hypre_CSRMatrixData(hoffd) = NULL;
8256ea7df73SStefano Zampini   }
826613e5ff0Sstefano_zampini   hypre_ParCSRMatrixColMapOffd(*hA) = NULL;
827613e5ff0Sstefano_zampini   hypre_ParCSRMatrixDestroy(*hA);
828613e5ff0Sstefano_zampini   *hA = NULL;
829613e5ff0Sstefano_zampini   PetscFunctionReturn(0);
830613e5ff0Sstefano_zampini }
831613e5ff0Sstefano_zampini 
832613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG:
8333dad0653Sstefano_zampini    the resulting ParCSR will not own the column and row starts
8346ea7df73SStefano Zampini    It looks like we don't need to have the diagonal entries ordered first */
/* Input:  hR, hA, hP - the ParCSR operands handed to hypre
   Output: hRAP       - the ParCSR matrix produced by hypre
   With PETSC_HAVE_HYPRE_DEVICE the product comes from hypre_ParCSRMatrixRAP(), otherwise
   from hypre_BoomerAMGBuildCoarseOperator() followed by hypre_ParCSRMatrixSetNumNonzeros().
   When hypre_ParCSRMatrixOwnsRowStarts is defined, the result is marked as not owning its
   row/column starts and ownership is set back on hP/hR if they owned theirs on entry. */
835a055b5aaSBarry Smith static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA,hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP)
836613e5ff0Sstefano_zampini {
837a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
838613e5ff0Sstefano_zampini   HYPRE_Int P_owns_col_starts,R_owns_row_starts;
839a1d2239cSSatish Balay #endif
840613e5ff0Sstefano_zampini 
841613e5ff0Sstefano_zampini   PetscFunctionBegin;
  /* remember the ownership flags as they are before hypre is called */
842a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
843613e5ff0Sstefano_zampini   P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP);
844613e5ff0Sstefano_zampini   R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR);
845a1d2239cSSatish Balay #endif
8466ea7df73SStefano Zampini   /* can be replaced by version test later */
8476ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
8486ea7df73SStefano Zampini   PetscStackPush("hypre_ParCSRMatrixRAP");
8496ea7df73SStefano Zampini   *hRAP = hypre_ParCSRMatrixRAP(hR,hA,hP);
8506ea7df73SStefano Zampini   PetscStackPop;
8516ea7df73SStefano Zampini #else
852a74df02fSJacob Faibussowitsch   PetscStackCallStandard(hypre_BoomerAMGBuildCoarseOperator,hR,hA,hP,hRAP);
853a74df02fSJacob Faibussowitsch   PetscStackCallStandard(hypre_ParCSRMatrixSetNumNonzeros,*hRAP);
8546ea7df73SStefano Zampini #endif
855613e5ff0Sstefano_zampini   /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */
856a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
857613e5ff0Sstefano_zampini   hypre_ParCSRMatrixSetRowStartsOwner(*hRAP,0);
858613e5ff0Sstefano_zampini   hypre_ParCSRMatrixSetColStartsOwner(*hRAP,0);
859613e5ff0Sstefano_zampini   if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP,1);
860613e5ff0Sstefano_zampini   if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR,1);
861a1d2239cSSatish Balay #endif
862613e5ff0Sstefano_zampini   PetscFunctionReturn(0);
863613e5ff0Sstefano_zampini }
864613e5ff0Sstefano_zampini 
/*
   MatPtAPNumeric_AIJ_AIJ_wHYPRE - Numeric PtAP phase for AIJ matrices A and P using hypre.

   A and P are wrapped as temporary ParCSR matrices, MatHYPRE_ParCSR_RAP() is called with
   P's wrapper passed as both the R and the P operand, and the result is turned into a
   MATAIJ matrix that is merged into C. The wrappers are released before returning.
*/
8656f231fbdSstefano_zampini static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A,Mat P,Mat C)
866613e5ff0Sstefano_zampini {
8676f231fbdSstefano_zampini   Mat                B;
8686abb4441SStefano Zampini   hypre_ParCSRMatrix *hA,*hP,*hPtAP = NULL;
  /* saved here so that it can be put back on C after MatHeaderMerge() */
8694222ddf1SHong Zhang   Mat_Product        *product=C->product;
870613e5ff0Sstefano_zampini 
871613e5ff0Sstefano_zampini   PetscFunctionBegin;
8729566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A,&hA));
8739566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(P,&hP));
8749566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(hP,hA,hP,&hPtAP));
  /* B is created with PETSC_OWN_POINTER for hPtAP, so hPtAP is not destroyed in this function */
8759566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hPtAP,MATAIJ,PETSC_OWN_POINTER,&B));
8764222ddf1SHong Zhang 
8779566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C,&B));
8784222ddf1SHong Zhang   C->product = product;
8794222ddf1SHong Zhang 
8809566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A,&hA));
8819566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(P,&hP));
8826f231fbdSstefano_zampini   PetscFunctionReturn(0);
8836f231fbdSstefano_zampini }
8846f231fbdSstefano_zampini 
/*
   MatPtAPSymbolic_AIJ_AIJ_wHYPRE - Symbolic PtAP phase for the hypre-based AIJ product.

   Only sets the type of C to MATAIJ and installs MatPtAPNumeric_AIJ_AIJ_wHYPRE and
   MatProductNumeric_PtAP as its numeric callbacks; A, P and fill are not used here.
*/
8854222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A,Mat P,PetscReal fill,Mat C)
8866f231fbdSstefano_zampini {
8876f231fbdSstefano_zampini   PetscFunctionBegin;
8889566063dSJacob Faibussowitsch   PetscCall(MatSetType(C,MATAIJ));
8894222ddf1SHong Zhang   C->ops->ptapnumeric    = MatPtAPNumeric_AIJ_AIJ_wHYPRE;
8904222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_PtAP;
891613e5ff0Sstefano_zampini   PetscFunctionReturn(0);
892613e5ff0Sstefano_zampini }
893613e5ff0Sstefano_zampini 
/*
   MatPtAPNumeric_AIJ_HYPRE - Numeric PtAP phase with an AIJ matrix A and a MATHYPRE matrix P.

   Errors with PETSC_ERR_USER if P is not of type MATHYPRE and with PETSC_ERR_SUP if its
   IJ matrix is not of object type HYPRE_PARCSR. A is wrapped as a temporary ParCSR matrix
   only for the duration of the MatHYPRE_ParCSR_RAP() call; the result is converted to a
   matrix of C's current type and merged into C.
*/
8944cc28894Sstefano_zampini static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A,Mat P,Mat C)
895613e5ff0Sstefano_zampini {
8964cc28894Sstefano_zampini   Mat                B;
8974cc28894Sstefano_zampini   Mat_HYPRE          *hP;
8986abb4441SStefano Zampini   hypre_ParCSRMatrix *hA = NULL,*Pparcsr,*ptapparcsr = NULL;
899613e5ff0Sstefano_zampini   HYPRE_Int          type;
900613e5ff0Sstefano_zampini   MPI_Comm           comm = PetscObjectComm((PetscObject)A);
9014cc28894Sstefano_zampini   PetscBool          ishypre;
902613e5ff0Sstefano_zampini 
903613e5ff0Sstefano_zampini   PetscFunctionBegin;
9049566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)P,MATHYPRE,&ishypre));
90528b400f6SJacob Faibussowitsch   PetscCheck(ishypre,comm,PETSC_ERR_USER,"P should be of type %s",MATHYPRE);
9064cc28894Sstefano_zampini   hP = (Mat_HYPRE*)P->data;
907a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hP->ij,&type);
9082c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
  /* fetch the ParCSR object stored behind P's IJ matrix */
909a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hP->ij,(void**)&Pparcsr);
910613e5ff0Sstefano_zampini 
  /* P's ParCSR is passed as both the R and the P operand */
9119566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A,&hA));
9129566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr,hA,Pparcsr,&ptapparcsr));
9139566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A,&hA));
914225daaf8SStefano Zampini 
9154cc28894Sstefano_zampini   /* create temporary matrix and merge to C */
9169566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ptapparcsr,((PetscObject)C)->type_name,PETSC_OWN_POINTER,&B));
9179566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C,&B));
9184cc28894Sstefano_zampini   PetscFunctionReturn(0);
9194cc28894Sstefano_zampini }
9204cc28894Sstefano_zampini 
/*
   MatPtAPNumeric_HYPRE_HYPRE - Numeric PtAP phase when both A and P are MATHYPRE matrices.

   Errors with PETSC_ERR_USER if A or P is not of type MATHYPRE and with PETSC_ERR_SUP if
   either IJ matrix is not of object type HYPRE_PARCSR. The ParCSR objects of A and P are
   passed to MatHYPRE_ParCSR_RAP() (P as both the R and the P operand); the result is
   wrapped in a MATHYPRE matrix and merged into C.
*/
9214cc28894Sstefano_zampini static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A,Mat P,Mat C)
9224cc28894Sstefano_zampini {
9234cc28894Sstefano_zampini   Mat                B;
9246abb4441SStefano Zampini   hypre_ParCSRMatrix *Aparcsr,*Pparcsr,*ptapparcsr = NULL;
9254cc28894Sstefano_zampini   Mat_HYPRE          *hA,*hP;
9264cc28894Sstefano_zampini   PetscBool          ishypre;
9274cc28894Sstefano_zampini   HYPRE_Int          type;
9284cc28894Sstefano_zampini 
9294cc28894Sstefano_zampini   PetscFunctionBegin;
  /* type checks: each error is raised on the communicator of the offending matrix */
9309566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)P,MATHYPRE,&ishypre));
93128b400f6SJacob Faibussowitsch   PetscCheck(ishypre,PetscObjectComm((PetscObject)P),PETSC_ERR_USER,"P should be of type %s",MATHYPRE);
9329566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&ishypre));
93328b400f6SJacob Faibussowitsch   PetscCheck(ishypre,PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"A should be of type %s",MATHYPRE);
9344cc28894Sstefano_zampini   hA = (Mat_HYPRE*)A->data;
9354cc28894Sstefano_zampini   hP = (Mat_HYPRE*)P->data;
936a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hA->ij,&type);
9372c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
938a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hP->ij,&type);
9392c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)P),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
  /* fetch the ParCSR objects stored behind the IJ matrices */
940a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&Aparcsr);
941a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hP->ij,(void**)&Pparcsr);
9429566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr,Aparcsr,Pparcsr,&ptapparcsr));
  /* B is created with PETSC_OWN_POINTER for ptapparcsr and then merged into C */
9439566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ptapparcsr,MATHYPRE,PETSC_OWN_POINTER,&B));
9449566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C,&B));
9454cc28894Sstefano_zampini   PetscFunctionReturn(0);
9464cc28894Sstefano_zampini }
9474cc28894Sstefano_zampini 
948d501dc42Sstefano_zampini /* calls hypre_ParMatmul
949d501dc42Sstefano_zampini    hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA
9503dad0653Sstefano_zampini    hypre_ParMatrixCreate does not duplicate the communicator
9516ea7df73SStefano Zampini    It looks like we don't need to have the diagonal entries ordered first */
952d501dc42Sstefano_zampini static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB)
953d501dc42Sstefano_zampini {
954d501dc42Sstefano_zampini   PetscFunctionBegin;
9556ea7df73SStefano Zampini   /* can be replaced by version test later */
9566ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
9576ea7df73SStefano Zampini   PetscStackPush("hypre_ParCSRMatMat");
9586ea7df73SStefano Zampini   *hAB = hypre_ParCSRMatMat(hA,hB);
9596ea7df73SStefano Zampini #else
960d501dc42Sstefano_zampini   PetscStackPush("hypre_ParMatmul");
961d501dc42Sstefano_zampini   *hAB = hypre_ParMatmul(hA,hB);
9626ea7df73SStefano Zampini #endif
963d501dc42Sstefano_zampini   PetscStackPop;
964d501dc42Sstefano_zampini   PetscFunctionReturn(0);
965d501dc42Sstefano_zampini }
966d501dc42Sstefano_zampini 
9675e5acdf2Sstefano_zampini static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C)
9685e5acdf2Sstefano_zampini {
9695e5acdf2Sstefano_zampini   Mat                D;
970d501dc42Sstefano_zampini   hypre_ParCSRMatrix *hA,*hB,*hAB = NULL;
9714222ddf1SHong Zhang   Mat_Product        *product=C->product;
9725e5acdf2Sstefano_zampini 
9735e5acdf2Sstefano_zampini   PetscFunctionBegin;
9749566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A,&hA));
9759566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(B,&hB));
9769566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_MatMatMult(hA,hB,&hAB));
9779566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hAB,MATAIJ,PETSC_OWN_POINTER,&D));
9784222ddf1SHong Zhang 
9799566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C,&D));
9804222ddf1SHong Zhang   C->product = product;
9814222ddf1SHong Zhang 
9829566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A,&hA));
9839566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(B,&hB));
9845e5acdf2Sstefano_zampini   PetscFunctionReturn(0);
9855e5acdf2Sstefano_zampini }
9865e5acdf2Sstefano_zampini 
9874222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A,Mat B,PetscReal fill,Mat C)
9885e5acdf2Sstefano_zampini {
9895e5acdf2Sstefano_zampini   PetscFunctionBegin;
9909566063dSJacob Faibussowitsch   PetscCall(MatSetType(C,MATAIJ));
9914222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE;
9924222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
9935e5acdf2Sstefano_zampini   PetscFunctionReturn(0);
9945e5acdf2Sstefano_zampini }
9955e5acdf2Sstefano_zampini 
996d501dc42Sstefano_zampini static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A,Mat B,Mat C)
997d501dc42Sstefano_zampini {
998d501dc42Sstefano_zampini   Mat                D;
999d501dc42Sstefano_zampini   hypre_ParCSRMatrix *Aparcsr,*Bparcsr,*ABparcsr = NULL;
1000d501dc42Sstefano_zampini   Mat_HYPRE          *hA,*hB;
1001d501dc42Sstefano_zampini   PetscBool          ishypre;
1002d501dc42Sstefano_zampini   HYPRE_Int          type;
10034222ddf1SHong Zhang   Mat_Product        *product;
1004d501dc42Sstefano_zampini 
1005d501dc42Sstefano_zampini   PetscFunctionBegin;
10069566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B,MATHYPRE,&ishypre));
100728b400f6SJacob Faibussowitsch   PetscCheck(ishypre,PetscObjectComm((PetscObject)B),PETSC_ERR_USER,"B should be of type %s",MATHYPRE);
10089566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&ishypre));
100928b400f6SJacob Faibussowitsch   PetscCheck(ishypre,PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"A should be of type %s",MATHYPRE);
1010d501dc42Sstefano_zampini   hA = (Mat_HYPRE*)A->data;
1011d501dc42Sstefano_zampini   hB = (Mat_HYPRE*)B->data;
1012a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hA->ij,&type);
10132c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
1014a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hB->ij,&type);
10152c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)B),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported");
1016a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&Aparcsr);
1017a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hB->ij,(void**)&Bparcsr);
10189566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_MatMatMult(Aparcsr,Bparcsr,&ABparcsr));
10199566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ABparcsr,MATHYPRE,PETSC_OWN_POINTER,&D));
10204222ddf1SHong Zhang 
1021d501dc42Sstefano_zampini   /* need to use HeaderReplace because HeaderMerge messes up with the communicator */
10224222ddf1SHong Zhang   product    = C->product;  /* save it from MatHeaderReplace() */
10234222ddf1SHong Zhang   C->product = NULL;
10249566063dSJacob Faibussowitsch   PetscCall(MatHeaderReplace(C,&D));
10254222ddf1SHong Zhang   C->product = product;
1026d501dc42Sstefano_zampini   C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE;
10274222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
1028d501dc42Sstefano_zampini   PetscFunctionReturn(0);
1029d501dc42Sstefano_zampini }
1030d501dc42Sstefano_zampini 
10313dad0653Sstefano_zampini PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C,Mat D)
103220e1dc0dSstefano_zampini {
103320e1dc0dSstefano_zampini   Mat                E;
10346abb4441SStefano Zampini   hypre_ParCSRMatrix *hA,*hB,*hC,*hABC = NULL;
103520e1dc0dSstefano_zampini 
103620e1dc0dSstefano_zampini   PetscFunctionBegin;
10379566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A,&hA));
10389566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(B,&hB));
10399566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(C,&hC));
10409566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(hA,hB,hC,&hABC));
10419566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hABC,MATAIJ,PETSC_OWN_POINTER,&E));
10429566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(D,&E));
10439566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A,&hA));
10449566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(B,&hB));
10459566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(C,&hC));
104620e1dc0dSstefano_zampini   PetscFunctionReturn(0);
104720e1dc0dSstefano_zampini }
104820e1dc0dSstefano_zampini 
10494222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C,PetscReal fill,Mat D)
105020e1dc0dSstefano_zampini {
105120e1dc0dSstefano_zampini   PetscFunctionBegin;
10529566063dSJacob Faibussowitsch   PetscCall(MatSetType(D,MATAIJ));
105320e1dc0dSstefano_zampini   PetscFunctionReturn(0);
105420e1dc0dSstefano_zampini }
105520e1dc0dSstefano_zampini 
10564222ddf1SHong Zhang /* ---------------------------------------------------- */
10574222ddf1SHong Zhang static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C)
10584222ddf1SHong Zhang {
10594222ddf1SHong Zhang   PetscFunctionBegin;
10604222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
10614222ddf1SHong Zhang   PetscFunctionReturn(0);
10624222ddf1SHong Zhang }
10634222ddf1SHong Zhang 
10644222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C)
10654222ddf1SHong Zhang {
10664222ddf1SHong Zhang   Mat_Product    *product = C->product;
10674222ddf1SHong Zhang   PetscBool      Ahypre;
10684222ddf1SHong Zhang 
10694222ddf1SHong Zhang   PetscFunctionBegin;
10709566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)product->A,MATHYPRE,&Ahypre));
10714222ddf1SHong Zhang   if (Ahypre) { /* A is a Hypre matrix */
10729566063dSJacob Faibussowitsch     PetscCall(MatSetType(C,MATHYPRE));
10734222ddf1SHong Zhang     C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE;
10744222ddf1SHong Zhang     C->ops->matmultnumeric  = MatMatMultNumeric_HYPRE_HYPRE;
10754222ddf1SHong Zhang     PetscFunctionReturn(0);
10766718818eSStefano Zampini   }
10774222ddf1SHong Zhang   PetscFunctionReturn(0);
10784222ddf1SHong Zhang }
10794222ddf1SHong Zhang 
10804222ddf1SHong Zhang static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C)
10814222ddf1SHong Zhang {
10824222ddf1SHong Zhang   PetscFunctionBegin;
10834222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_PtAP;
10844222ddf1SHong Zhang   PetscFunctionReturn(0);
10854222ddf1SHong Zhang }
10864222ddf1SHong Zhang 
10874222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C)
10884222ddf1SHong Zhang {
10894222ddf1SHong Zhang   Mat_Product    *product = C->product;
10904222ddf1SHong Zhang   PetscBool      flg;
10914222ddf1SHong Zhang   PetscInt       type = 0;
10924222ddf1SHong Zhang   const char     *outTypes[4] = {"aij","seqaij","mpiaij","hypre"};
10934222ddf1SHong Zhang   PetscInt       ntype = 4;
10944222ddf1SHong Zhang   Mat            A = product->A;
10954222ddf1SHong Zhang   PetscBool      Ahypre;
10965f80ce2aSJacob Faibussowitsch   PetscErrorCode ierr;
10974222ddf1SHong Zhang 
10984222ddf1SHong Zhang   PetscFunctionBegin;
10999566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&Ahypre));
11004222ddf1SHong Zhang   if (Ahypre) { /* A is a Hypre matrix */
11019566063dSJacob Faibussowitsch     PetscCall(MatSetType(C,MATHYPRE));
11024222ddf1SHong Zhang     C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE;
11034222ddf1SHong Zhang     C->ops->ptapnumeric     = MatPtAPNumeric_HYPRE_HYPRE;
11044222ddf1SHong Zhang     PetscFunctionReturn(0);
11054222ddf1SHong Zhang   }
11064222ddf1SHong Zhang 
11074222ddf1SHong Zhang   /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */
11084222ddf1SHong Zhang   /* Get runtime option */
11094222ddf1SHong Zhang   if (product->api_user) {
11109566063dSJacob Faibussowitsch     ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)C),((PetscObject)C)->prefix,"MatPtAP_HYPRE","Mat");PetscCall(ierr);
11119566063dSJacob Faibussowitsch     PetscCall(PetscOptionsEList("-matptap_hypre_outtype","MatPtAP outtype","MatPtAP outtype",outTypes,ntype,outTypes[type],&type,&flg));
11129566063dSJacob Faibussowitsch     ierr = PetscOptionsEnd();PetscCall(ierr);
11134222ddf1SHong Zhang   } else {
11149566063dSJacob Faibussowitsch     ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)C),((PetscObject)C)->prefix,"MatProduct_PtAP_HYPRE","Mat");PetscCall(ierr);
11159566063dSJacob Faibussowitsch     PetscCall(PetscOptionsEList("-mat_product_algorithm_hypre_outtype","MatProduct_PtAP outtype","MatProduct_PtAP",outTypes,ntype,outTypes[type],&type,&flg));
11169566063dSJacob Faibussowitsch     ierr = PetscOptionsEnd();PetscCall(ierr);
11174222ddf1SHong Zhang   }
11184222ddf1SHong Zhang 
11194222ddf1SHong Zhang   if (type == 0 || type == 1 || type == 2) {
11209566063dSJacob Faibussowitsch     PetscCall(MatSetType(C,MATAIJ));
11214222ddf1SHong Zhang   } else if (type == 3) {
11229566063dSJacob Faibussowitsch     PetscCall(MatSetType(C,MATHYPRE));
11234222ddf1SHong Zhang   } else SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_SUP,"MatPtAP outtype is not supported");
11244222ddf1SHong Zhang   C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE;
11254222ddf1SHong Zhang   C->ops->ptapnumeric     = MatPtAPNumeric_AIJ_HYPRE;
11264222ddf1SHong Zhang   PetscFunctionReturn(0);
11274222ddf1SHong Zhang }
11284222ddf1SHong Zhang 
11294222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C)
11304222ddf1SHong Zhang {
11314222ddf1SHong Zhang   Mat_Product    *product = C->product;
11324222ddf1SHong Zhang 
11334222ddf1SHong Zhang   PetscFunctionBegin;
11344222ddf1SHong Zhang   switch (product->type) {
11354222ddf1SHong Zhang   case MATPRODUCT_AB:
11369566063dSJacob Faibussowitsch     PetscCall(MatProductSetFromOptions_HYPRE_AB(C));
11374222ddf1SHong Zhang     break;
11384222ddf1SHong Zhang   case MATPRODUCT_PtAP:
11399566063dSJacob Faibussowitsch     PetscCall(MatProductSetFromOptions_HYPRE_PtAP(C));
11404222ddf1SHong Zhang     break;
11416718818eSStefano Zampini   default:
11426718818eSStefano Zampini     break;
11434222ddf1SHong Zhang   }
11444222ddf1SHong Zhang   PetscFunctionReturn(0);
11454222ddf1SHong Zhang }
11464222ddf1SHong Zhang 
11474222ddf1SHong Zhang /* -------------------------------------------------------- */
11484222ddf1SHong Zhang 
1149ea9daf28SStefano Zampini static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y)
115063c07aadSStefano Zampini {
115163c07aadSStefano Zampini   PetscFunctionBegin;
11529566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A,1.0,x,0.0,y,PETSC_TRUE));
115363c07aadSStefano Zampini   PetscFunctionReturn(0);
115463c07aadSStefano Zampini }
115563c07aadSStefano Zampini 
1156ea9daf28SStefano Zampini static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y)
115763c07aadSStefano Zampini {
115863c07aadSStefano Zampini   PetscFunctionBegin;
11599566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A,1.0,x,0.0,y,PETSC_FALSE));
116063c07aadSStefano Zampini   PetscFunctionReturn(0);
116163c07aadSStefano Zampini }
116263c07aadSStefano Zampini 
1163414bd5c3SStefano Zampini static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z)
1164414bd5c3SStefano Zampini {
1165414bd5c3SStefano Zampini   PetscFunctionBegin;
1166414bd5c3SStefano Zampini   if (y != z) {
11679566063dSJacob Faibussowitsch     PetscCall(VecCopy(y,z));
1168414bd5c3SStefano Zampini   }
11699566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A,1.0,x,1.0,z,PETSC_FALSE));
1170414bd5c3SStefano Zampini   PetscFunctionReturn(0);
1171414bd5c3SStefano Zampini }
1172414bd5c3SStefano Zampini 
1173414bd5c3SStefano Zampini static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z)
1174414bd5c3SStefano Zampini {
1175414bd5c3SStefano Zampini   PetscFunctionBegin;
1176414bd5c3SStefano Zampini   if (y != z) {
11779566063dSJacob Faibussowitsch     PetscCall(VecCopy(y,z));
1178414bd5c3SStefano Zampini   }
11799566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A,1.0,x,1.0,z,PETSC_TRUE));
1180414bd5c3SStefano Zampini   PetscFunctionReturn(0);
1181414bd5c3SStefano Zampini }
1182414bd5c3SStefano Zampini 
1183414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */
118439accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans)
118563c07aadSStefano Zampini {
118663c07aadSStefano Zampini   Mat_HYPRE          *hA = (Mat_HYPRE*)A->data;
118763c07aadSStefano Zampini   hypre_ParCSRMatrix *parcsr;
118863c07aadSStefano Zampini   hypre_ParVector    *hx,*hy;
118963c07aadSStefano Zampini 
119063c07aadSStefano Zampini   PetscFunctionBegin;
119163c07aadSStefano Zampini   if (trans) {
11929566063dSJacob Faibussowitsch     PetscCall(VecHYPRE_IJVectorPushVecRead(hA->b,x));
11939566063dSJacob Faibussowitsch     if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->x,y));
11949566063dSJacob Faibussowitsch     else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->x,y));
1195a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJVectorGetObject,hA->b->ij,(void**)&hx);
1196a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJVectorGetObject,hA->x->ij,(void**)&hy);
119763c07aadSStefano Zampini   } else {
11989566063dSJacob Faibussowitsch     PetscCall(VecHYPRE_IJVectorPushVecRead(hA->x,x));
11999566063dSJacob Faibussowitsch     if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->b,y));
12009566063dSJacob Faibussowitsch     else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->b,y));
1201a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJVectorGetObject,hA->x->ij,(void**)&hx);
1202a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJVectorGetObject,hA->b->ij,(void**)&hy);
120363c07aadSStefano Zampini   }
1204a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr);
12056ea7df73SStefano Zampini   if (trans) {
1206a74df02fSJacob Faibussowitsch     PetscStackCallStandard(hypre_ParCSRMatrixMatvecT,a,parcsr,hx,b,hy);
12076ea7df73SStefano Zampini   } else {
1208a74df02fSJacob Faibussowitsch     PetscStackCallStandard(hypre_ParCSRMatrixMatvec,a,parcsr,hx,b,hy);
12096ea7df73SStefano Zampini   }
12109566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorPopVec(hA->x));
12119566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorPopVec(hA->b));
121263c07aadSStefano Zampini   PetscFunctionReturn(0);
121363c07aadSStefano Zampini }
121463c07aadSStefano Zampini 
1215ea9daf28SStefano Zampini static PetscErrorCode MatDestroy_HYPRE(Mat A)
121663c07aadSStefano Zampini {
121763c07aadSStefano Zampini   Mat_HYPRE      *hA = (Mat_HYPRE*)A->data;
121863c07aadSStefano Zampini 
121963c07aadSStefano Zampini   PetscFunctionBegin;
12209566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorDestroy(&hA->x));
12219566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorDestroy(&hA->b));
1222978814f1SStefano Zampini   if (hA->ij) {
1223978814f1SStefano Zampini     if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL;
1224a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixDestroy,hA->ij);
1225978814f1SStefano Zampini   }
12269566063dSJacob Faibussowitsch   if (hA->comm) PetscCall(PetscCommRestoreComm(PetscObjectComm((PetscObject)A),&hA->comm));
1227c69f721fSFande Kong 
12289566063dSJacob Faibussowitsch   PetscCall(MatStashDestroy_Private(&A->stash));
12299566063dSJacob Faibussowitsch   PetscCall(PetscFree(hA->array));
1230c69f721fSFande Kong 
12315fbaff96SJunchao Zhang   if (hA->cooMat) {
12325fbaff96SJunchao Zhang     PetscCall(MatDestroy(&hA->cooMat));
12335fbaff96SJunchao Zhang     PetscStackCall("hypre_TFree",hypre_TFree(hA->diagJ,hA->memType));
12345fbaff96SJunchao Zhang     PetscStackCall("hypre_TFree",hypre_TFree(hA->offdJ,hA->memType));
12355fbaff96SJunchao Zhang     PetscStackCall("hypre_TFree",hypre_TFree(hA->diag,hA->memType));
12365fbaff96SJunchao Zhang   }
12375fbaff96SJunchao Zhang 
12389566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_hypre_aij_C",NULL));
12399566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_hypre_is_C",NULL));
12409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_hypre_C",NULL));
12419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_mpiaij_hypre_C",NULL));
12429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatHYPRESetPreallocation_C",NULL));
12439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatHYPREGetParCSR_C",NULL));
12445fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetPreallocationCOO_C",NULL));
12455fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetValuesCOO_C",NULL));
12469566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
124763c07aadSStefano Zampini   PetscFunctionReturn(0);
124863c07aadSStefano Zampini }
124963c07aadSStefano Zampini 
1250ea9daf28SStefano Zampini static PetscErrorCode MatSetUp_HYPRE(Mat A)
125163c07aadSStefano Zampini {
12524ec6421dSstefano_zampini   PetscFunctionBegin;
12539566063dSJacob Faibussowitsch   PetscCall(MatHYPRESetPreallocation(A,PETSC_DEFAULT,NULL,PETSC_DEFAULT,NULL));
12544ec6421dSstefano_zampini   PetscFunctionReturn(0);
12554ec6421dSstefano_zampini }
12564ec6421dSstefano_zampini 
12576ea7df73SStefano Zampini //TODO FIX hypre_CSRMatrixMatvecOutOfPlace
#if defined(PETSC_HAVE_HYPRE_DEVICE)
/*
   Binds A to the host (bind = PETSC_TRUE) or to the device (bind = PETSC_FALSE).

   The flag is recorded in A->boundtocpu. If the IJ matrix exists, is assembled and
   currently lives in the other memory space, its ParCSR object is migrated with
   hypre_ParCSRMatrixMigrate(). The work IJ vectors, when present, are bound as well.
*/
static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind)
{
  Mat_HYPRE            *hA     = (Mat_HYPRE*)A->data;
  HYPRE_MemoryLocation  target = bind ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE;

  PetscFunctionBegin;
  A->boundtocpu = bind;
  if (hA->ij && hypre_IJMatrixAssembleFlag(hA->ij)) {
    if (hypre_IJMatrixMemoryLocation(hA->ij) != target) {
      hypre_ParCSRMatrix *csr;

      PetscStackCallStandard(HYPRE_IJMatrixGetObject, hA->ij, (void**)&csr);
      PetscStackCallStandard(hypre_ParCSRMatrixMigrate, csr, target);
    }
  }
  if (hA->x) PetscCall(VecHYPRE_IJBindToCPU(hA->x, bind));
  if (hA->b) PetscCall(VecHYPRE_IJBindToCPU(hA->b, bind));
  PetscFunctionReturn(0);
}
#endif
12766ea7df73SStefano Zampini 
12774ec6421dSstefano_zampini static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode)
12784ec6421dSstefano_zampini {
127963c07aadSStefano Zampini   Mat_HYPRE          *hA = (Mat_HYPRE*)A->data;
1280c69f721fSFande Kong   PetscMPIInt        n;
1281c69f721fSFande Kong   PetscInt           i,j,rstart,ncols,flg;
1282c69f721fSFande Kong   PetscInt           *row,*col;
1283c69f721fSFande Kong   PetscScalar        *val;
128463c07aadSStefano Zampini 
128563c07aadSStefano Zampini   PetscFunctionBegin;
12862c71b3e2SJacob Faibussowitsch   PetscCheckFalse(mode == MAT_FLUSH_ASSEMBLY,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE");
1287c69f721fSFande Kong 
1288c69f721fSFande Kong   if (!A->nooffprocentries) {
1289c69f721fSFande Kong     while (1) {
12909566063dSJacob Faibussowitsch       PetscCall(MatStashScatterGetMesg_Private(&A->stash,&n,&row,&col,&val,&flg));
1291c69f721fSFande Kong       if (!flg) break;
1292c69f721fSFande Kong 
1293c69f721fSFande Kong       for (i=0; i<n;) {
1294c69f721fSFande Kong         /* Now identify the consecutive vals belonging to the same row */
1295c69f721fSFande Kong         for (j=i,rstart=row[j]; j<n; j++) {
1296c69f721fSFande Kong           if (row[j] != rstart) break;
1297c69f721fSFande Kong         }
1298c69f721fSFande Kong         if (j < n) ncols = j-i;
1299c69f721fSFande Kong         else       ncols = n-i;
1300c69f721fSFande Kong         /* Now assemble all these values with a single function call */
13019566063dSJacob Faibussowitsch         PetscCall(MatSetValues_HYPRE(A,1,row+i,ncols,col+i,val+i,A->insertmode));
1302c69f721fSFande Kong 
1303c69f721fSFande Kong         i = j;
1304c69f721fSFande Kong       }
1305c69f721fSFande Kong     }
13069566063dSJacob Faibussowitsch     PetscCall(MatStashScatterEnd_Private(&A->stash));
1307c69f721fSFande Kong   }
1308c69f721fSFande Kong 
1309a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixAssemble,hA->ij);
1310336664bdSPierre Jolivet   /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */
1311336664bdSPierre Jolivet   /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */
1312336664bdSPierre Jolivet   if (!hA->sorted_full) {
1313af1cf968SStefano Zampini     hypre_AuxParCSRMatrix *aux_matrix;
1314af1cf968SStefano Zampini 
1315af1cf968SStefano Zampini     /* call destroy just to make sure we do not leak anything */
1316af1cf968SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij);
1317a74df02fSJacob Faibussowitsch     PetscStackCallStandard(hypre_AuxParCSRMatrixDestroy,aux_matrix);
1318af1cf968SStefano Zampini     hypre_IJMatrixTranslator(hA->ij) = NULL;
1319af1cf968SStefano Zampini 
1320af1cf968SStefano Zampini     /* Initialize with assembled flag -> it only recreates the aux_par_matrix */
1321a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixInitialize,hA->ij);
1322af1cf968SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij);
13236ea7df73SStefano Zampini     if (aux_matrix) {
1324af1cf968SStefano Zampini       hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see comment in MatHYPRESetPreallocation_HYPRE */
132522235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0)
1326a74df02fSJacob Faibussowitsch       PetscStackCallStandard(hypre_AuxParCSRMatrixInitialize,aux_matrix);
132722235d61SPierre Jolivet #else
1328a74df02fSJacob Faibussowitsch       PetscStackCallStandard(hypre_AuxParCSRMatrixInitialize_v2,aux_matrix,HYPRE_MEMORY_HOST);
132922235d61SPierre Jolivet #endif
1330af1cf968SStefano Zampini     }
13316ea7df73SStefano Zampini   }
13326ea7df73SStefano Zampini   {
13336ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
13346ea7df73SStefano Zampini 
1335a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr);
1336a74df02fSJacob Faibussowitsch     if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscStackCallStandard(hypre_MatvecCommPkgCreate,parcsr);
13376ea7df73SStefano Zampini   }
13389566063dSJacob Faibussowitsch   if (!hA->x) PetscCall(VecHYPRE_IJVectorCreate(A->cmap,&hA->x));
13399566063dSJacob Faibussowitsch   if (!hA->b) PetscCall(VecHYPRE_IJVectorCreate(A->rmap,&hA->b));
13406ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
13419566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU_HYPRE(A,A->boundtocpu));
13426ea7df73SStefano Zampini #endif
134363c07aadSStefano Zampini   PetscFunctionReturn(0);
134463c07aadSStefano Zampini }
134563c07aadSStefano Zampini 
1346c69f721fSFande Kong static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array)
1347c69f721fSFande Kong {
1348c69f721fSFande Kong   Mat_HYPRE          *hA = (Mat_HYPRE*)A->data;
1349c69f721fSFande Kong 
1350c69f721fSFande Kong   PetscFunctionBegin;
135128b400f6SJacob Faibussowitsch   PetscCheck(hA->available,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Temporary space is in use");
1352c69f721fSFande Kong 
135339accc25SStefano Zampini   if (hA->size >= size) {
135439accc25SStefano Zampini     *array = hA->array;
135539accc25SStefano Zampini   } else {
13569566063dSJacob Faibussowitsch     PetscCall(PetscFree(hA->array));
1357c69f721fSFande Kong     hA->size = size;
13589566063dSJacob Faibussowitsch     PetscCall(PetscMalloc(hA->size,&hA->array));
1359c69f721fSFande Kong     *array = hA->array;
1360c69f721fSFande Kong   }
1361c69f721fSFande Kong 
1362c69f721fSFande Kong   hA->available = PETSC_FALSE;
1363c69f721fSFande Kong   PetscFunctionReturn(0);
1364c69f721fSFande Kong }
1365c69f721fSFande Kong 
1366708542d2SFande Kong static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array)
1367c69f721fSFande Kong {
1368c69f721fSFande Kong   Mat_HYPRE          *hA = (Mat_HYPRE*)A->data;
1369c69f721fSFande Kong 
1370c69f721fSFande Kong   PetscFunctionBegin;
1371c69f721fSFande Kong   *array = NULL;
1372c69f721fSFande Kong   hA->available = PETSC_TRUE;
1373c69f721fSFande Kong   PetscFunctionReturn(0);
1374c69f721fSFande Kong }
1375c69f721fSFande Kong 
13766ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins)
1377d975228cSstefano_zampini {
1378d975228cSstefano_zampini   Mat_HYPRE      *hA = (Mat_HYPRE*)A->data;
1379d975228cSstefano_zampini   PetscScalar    *vals = (PetscScalar *)v;
138039accc25SStefano Zampini   HYPRE_Complex  *sscr;
1381c69f721fSFande Kong   PetscInt       *cscr[2];
1382c69f721fSFande Kong   PetscInt       i,nzc;
138308defe43SFande Kong   void           *array = NULL;
1384d975228cSstefano_zampini 
1385d975228cSstefano_zampini   PetscFunctionBegin;
13869566063dSJacob Faibussowitsch   PetscCall(MatGetArray_HYPRE(A,sizeof(PetscInt)*(2*nc)+sizeof(HYPRE_Complex)*nc*nr,&array));
1387c69f721fSFande Kong   cscr[0] = (PetscInt*)array;
1388c69f721fSFande Kong   cscr[1] = ((PetscInt*)array)+nc;
138939accc25SStefano Zampini   sscr = (HYPRE_Complex*)(((PetscInt*)array)+nc*2);
1390d975228cSstefano_zampini   for (i=0,nzc=0;i<nc;i++) {
1391d975228cSstefano_zampini     if (cols[i] >= 0) {
1392d975228cSstefano_zampini       cscr[0][nzc  ] = cols[i];
1393d975228cSstefano_zampini       cscr[1][nzc++] = i;
1394d975228cSstefano_zampini     }
1395d975228cSstefano_zampini   }
1396c69f721fSFande Kong   if (!nzc) {
13979566063dSJacob Faibussowitsch     PetscCall(MatRestoreArray_HYPRE(A,&array));
1398c69f721fSFande Kong     PetscFunctionReturn(0);
1399c69f721fSFande Kong   }
1400d975228cSstefano_zampini 
14016ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE)
14026ea7df73SStefano Zampini   if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) {
14036ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
14046ea7df73SStefano Zampini 
1405a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr);
1406a74df02fSJacob Faibussowitsch     PetscStackCallStandard(hypre_ParCSRMatrixMigrate,parcsr, HYPRE_MEMORY_HOST);
14076ea7df73SStefano Zampini   }
14086ea7df73SStefano Zampini #endif
14096ea7df73SStefano Zampini 
1410d975228cSstefano_zampini   if (ins == ADD_VALUES) {
1411d975228cSstefano_zampini     for (i=0;i<nr;i++) {
14126ea7df73SStefano Zampini       if (rows[i] >= 0) {
1413d975228cSstefano_zampini         PetscInt  j;
14142cf14000SStefano Zampini         HYPRE_Int hnc = (HYPRE_Int)nzc;
14152cf14000SStefano Zampini 
14162c71b3e2SJacob Faibussowitsch         PetscCheckFalse((PetscInt)hnc != nzc,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,nzc,rows[i]);
14179566063dSJacob Faibussowitsch         for (j=0;j<nzc;j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]],&sscr[j]));
1418a74df02fSJacob Faibussowitsch         PetscStackCallStandard(HYPRE_IJMatrixAddToValues,hA->ij,1,&hnc,(HYPRE_BigInt*)(rows+i),(HYPRE_BigInt*)cscr[0],sscr);
1419d975228cSstefano_zampini       }
1420d975228cSstefano_zampini       vals += nc;
1421d975228cSstefano_zampini     }
1422d975228cSstefano_zampini   } else { /* INSERT_VALUES */
1423d975228cSstefano_zampini     PetscInt rst,ren;
1424c69f721fSFande Kong 
14259566063dSJacob Faibussowitsch     PetscCall(MatGetOwnershipRange(A,&rst,&ren));
1426d975228cSstefano_zampini     for (i=0;i<nr;i++) {
14276ea7df73SStefano Zampini       if (rows[i] >= 0) {
1428d975228cSstefano_zampini         PetscInt  j;
14292cf14000SStefano Zampini         HYPRE_Int hnc = (HYPRE_Int)nzc;
14302cf14000SStefano Zampini 
14312c71b3e2SJacob Faibussowitsch         PetscCheckFalse((PetscInt)hnc != nzc,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,nzc,rows[i]);
14329566063dSJacob Faibussowitsch         for (j=0;j<nzc;j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]],&sscr[j]));
1433c69f721fSFande Kong         /* nonlocal values */
14349566063dSJacob Faibussowitsch         if (rows[i] < rst || rows[i] >= ren) PetscCall(MatStashValuesRow_Private(&A->stash,rows[i],nzc,cscr[0],(PetscScalar*)sscr,PETSC_FALSE));
1435c69f721fSFande Kong         /* local values */
1436a74df02fSJacob Faibussowitsch         else PetscStackCallStandard(HYPRE_IJMatrixSetValues,hA->ij,1,&hnc,(HYPRE_BigInt*)(rows+i),(HYPRE_BigInt*)cscr[0],sscr);
1437d975228cSstefano_zampini       }
1438d975228cSstefano_zampini       vals += nc;
1439d975228cSstefano_zampini     }
1440d975228cSstefano_zampini   }
1441c69f721fSFande Kong 
14429566063dSJacob Faibussowitsch   PetscCall(MatRestoreArray_HYPRE(A,&array));
1443d975228cSstefano_zampini   PetscFunctionReturn(0);
1444d975228cSstefano_zampini }
1445d975228cSstefano_zampini 
1446d975228cSstefano_zampini static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[])
1447d975228cSstefano_zampini {
1448d975228cSstefano_zampini   Mat_HYPRE      *hA = (Mat_HYPRE*)A->data;
14497d968826Sstefano_zampini   HYPRE_Int      *hdnnz,*honnz;
145006a29025Sstefano_zampini   PetscInt       i,rs,re,cs,ce,bs;
1451d975228cSstefano_zampini   PetscMPIInt    size;
1452d975228cSstefano_zampini 
1453d975228cSstefano_zampini   PetscFunctionBegin;
14549566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
14559566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
1456d975228cSstefano_zampini   rs   = A->rmap->rstart;
1457d975228cSstefano_zampini   re   = A->rmap->rend;
1458d975228cSstefano_zampini   cs   = A->cmap->rstart;
1459d975228cSstefano_zampini   ce   = A->cmap->rend;
1460d975228cSstefano_zampini   if (!hA->ij) {
1461a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixCreate,hA->comm,rs,re-1,cs,ce-1,&hA->ij);
1462a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR);
1463d975228cSstefano_zampini   } else {
14642cf14000SStefano Zampini     HYPRE_BigInt hrs,hre,hcs,hce;
1465a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixGetLocalRange,hA->ij,&hrs,&hre,&hcs,&hce);
14662c71b3e2SJacob Faibussowitsch     PetscCheckFalse(hre-hrs+1 != re -rs,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Inconsistent local rows: IJMatrix [%" PetscInt_FMT ",%" PetscInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")",hrs,hre+1,rs,re);
14672c71b3e2SJacob Faibussowitsch     PetscCheckFalse(hce-hcs+1 != ce -cs,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Inconsistent local cols: IJMatrix [%" PetscInt_FMT ",%" PetscInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")",hcs,hce+1,cs,ce);
1468d975228cSstefano_zampini   }
14699566063dSJacob Faibussowitsch   PetscCall(MatGetBlockSize(A,&bs));
147006a29025Sstefano_zampini   if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10*bs;
147106a29025Sstefano_zampini   if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10*bs;
147206a29025Sstefano_zampini 
1473d975228cSstefano_zampini   if (!dnnz) {
14749566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n,&hdnnz));
1475d975228cSstefano_zampini     for (i=0;i<A->rmap->n;i++) hdnnz[i] = dnz;
1476d975228cSstefano_zampini   } else {
14777d968826Sstefano_zampini     hdnnz = (HYPRE_Int*)dnnz;
1478d975228cSstefano_zampini   }
14799566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A),&size));
1480d975228cSstefano_zampini   if (size > 1) {
1481ddbeb582SStefano Zampini     hypre_AuxParCSRMatrix *aux_matrix;
1482d975228cSstefano_zampini     if (!onnz) {
14839566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(A->rmap->n,&honnz));
1484d975228cSstefano_zampini       for (i=0;i<A->rmap->n;i++) honnz[i] = onz;
148522235d61SPierre Jolivet     } else honnz = (HYPRE_Int*)onnz;
1486ddbeb582SStefano Zampini     /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems
1487ddbeb582SStefano Zampini        they assume the user will input the entire row values, properly sorted
1488336664bdSPierre Jolivet        In PETSc, we don't make such an assumption and set this flag to 1,
1489336664bdSPierre Jolivet        unless the option MAT_SORTED_FULL is set to true.
1490ddbeb582SStefano Zampini        Also, to avoid possible memory leaks, we destroy and recreate the translator
1491ddbeb582SStefano Zampini        This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize
1492ddbeb582SStefano Zampini        the IJ matrix for us */
1493ddbeb582SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij);
1494ddbeb582SStefano Zampini     hypre_AuxParCSRMatrixDestroy(aux_matrix);
1495ddbeb582SStefano Zampini     hypre_IJMatrixTranslator(hA->ij) = NULL;
1496a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixSetDiagOffdSizes,hA->ij,hdnnz,honnz);
1497ddbeb582SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij);
1498336664bdSPierre Jolivet     hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !hA->sorted_full;
1499d975228cSstefano_zampini   } else {
1500d975228cSstefano_zampini     honnz = NULL;
1501a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixSetRowSizes,hA->ij,hdnnz);
1502d975228cSstefano_zampini   }
1503ddbeb582SStefano Zampini 
1504af1cf968SStefano Zampini   /* reset assembled flag and call the initialize method */
1505af1cf968SStefano Zampini   hypre_IJMatrixAssembleFlag(hA->ij) = 0;
15066ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0)
1507a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixInitialize,hA->ij);
15086ea7df73SStefano Zampini #else
1509a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixInitialize_v2,hA->ij,HYPRE_MEMORY_HOST);
15106ea7df73SStefano Zampini #endif
1511d975228cSstefano_zampini   if (!dnnz) {
15129566063dSJacob Faibussowitsch     PetscCall(PetscFree(hdnnz));
1513d975228cSstefano_zampini   }
1514d975228cSstefano_zampini   if (!onnz && honnz) {
15159566063dSJacob Faibussowitsch     PetscCall(PetscFree(honnz));
1516d975228cSstefano_zampini   }
1517af1cf968SStefano Zampini   /* Match AIJ logic */
151806a29025Sstefano_zampini   A->preallocated = PETSC_TRUE;
1519af1cf968SStefano Zampini   A->assembled    = PETSC_FALSE;
1520d975228cSstefano_zampini   PetscFunctionReturn(0);
1521d975228cSstefano_zampini }
1522d975228cSstefano_zampini 
1523d975228cSstefano_zampini /*@C
1524d975228cSstefano_zampini    MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format
1525d975228cSstefano_zampini 
1526d975228cSstefano_zampini    Collective on Mat
1527d975228cSstefano_zampini 
1528d975228cSstefano_zampini    Input Parameters:
1529d975228cSstefano_zampini +  A - the matrix
1530d975228cSstefano_zampini .  dnz  - number of nonzeros per row in DIAGONAL portion of local submatrix
1531d975228cSstefano_zampini           (same value is used for all local rows)
1532d975228cSstefano_zampini .  dnnz - array containing the number of nonzeros in the various rows of the
1533d975228cSstefano_zampini           DIAGONAL portion of the local submatrix (possibly different for each row)
1534d975228cSstefano_zampini           or NULL (PETSC_NULL_INTEGER in Fortran), if d_nz is used to specify the nonzero structure.
1535d975228cSstefano_zampini           The size of this array is equal to the number of local rows, i.e 'm'.
1536d975228cSstefano_zampini           For matrices that will be factored, you must leave room for (and set)
1537d975228cSstefano_zampini           the diagonal entry even if it is zero.
1538d975228cSstefano_zampini .  onz  - number of nonzeros per row in the OFF-DIAGONAL portion of local
1539d975228cSstefano_zampini           submatrix (same value is used for all local rows).
1540d975228cSstefano_zampini -  onnz - array containing the number of nonzeros in the various rows of the
1541d975228cSstefano_zampini           OFF-DIAGONAL portion of the local submatrix (possibly different for
1542d975228cSstefano_zampini           each row) or NULL (PETSC_NULL_INTEGER in Fortran), if o_nz is used to specify the nonzero
1543d975228cSstefano_zampini           structure. The size of this array is equal to the number
1544d975228cSstefano_zampini           of local rows, i.e 'm'.
1545d975228cSstefano_zampini 
154695452b02SPatrick Sanan    Notes:
154795452b02SPatrick Sanan     If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, onz and onnz are ignored.
1548d975228cSstefano_zampini 
1549d975228cSstefano_zampini    Level: intermediate
1550d975228cSstefano_zampini 
1551af1cf968SStefano Zampini .seealso: MatCreate(), MatMPIAIJSetPreallocation(), MATHYPRE
1552d975228cSstefano_zampini @*/
1553d975228cSstefano_zampini PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[])
1554d975228cSstefano_zampini {
1555d975228cSstefano_zampini   PetscFunctionBegin;
1556d975228cSstefano_zampini   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1557d975228cSstefano_zampini   PetscValidType(A,1);
1558*cac4c232SBarry Smith   PetscTryMethod(A,"MatHYPRESetPreallocation_C",(Mat,PetscInt,const PetscInt[],PetscInt,const PetscInt[]),(A,dnz,dnnz,onz,onnz));
1559d975228cSstefano_zampini   PetscFunctionReturn(0);
1560d975228cSstefano_zampini }
1561d975228cSstefano_zampini 
1562225daaf8SStefano Zampini /*
1563225daaf8SStefano Zampini    MatCreateFromParCSR - Creates a matrix from a hypre_ParCSRMatrix
1564225daaf8SStefano Zampini 
1565225daaf8SStefano Zampini    Collective
1566225daaf8SStefano Zampini 
1567225daaf8SStefano Zampini    Input Parameters:
156845b8d346SStefano Zampini +  parcsr   - the pointer to the hypre_ParCSRMatrix
1569bb4689ddSStefano Zampini .  mtype    - matrix type to be created. Currently MATAIJ, MATIS and MATHYPRE are supported.
1570225daaf8SStefano Zampini -  copymode - PETSc copying options
1571225daaf8SStefano Zampini 
1572225daaf8SStefano Zampini    Output Parameter:
1573225daaf8SStefano Zampini .  A  - the matrix
1574225daaf8SStefano Zampini 
1575225daaf8SStefano Zampini    Level: intermediate
1576225daaf8SStefano Zampini 
1577225daaf8SStefano Zampini .seealso: MatHYPRE, PetscCopyMode
1578225daaf8SStefano Zampini */
157945b8d346SStefano Zampini PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat* A)
1580978814f1SStefano Zampini {
1581225daaf8SStefano Zampini   Mat            T;
1582978814f1SStefano Zampini   Mat_HYPRE      *hA;
1583978814f1SStefano Zampini   MPI_Comm       comm;
1584978814f1SStefano Zampini   PetscInt       rstart,rend,cstart,cend,M,N;
1585d248a85cSRichard Tran Mills   PetscBool      isseqaij,isseqaijmkl,ismpiaij,isaij,ishyp,isis;
1586978814f1SStefano Zampini 
1587978814f1SStefano Zampini   PetscFunctionBegin;
1588978814f1SStefano Zampini   comm  = hypre_ParCSRMatrixComm(parcsr);
15899566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype,MATSEQAIJ,&isseqaij));
15909566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype,MATSEQAIJMKL,&isseqaijmkl));
15919566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype,MATMPIAIJ,&ismpiaij));
15929566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype,MATAIJ,&isaij));
15939566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype,MATHYPRE,&ishyp));
15949566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype,MATIS,&isis));
1595d248a85cSRichard Tran Mills   isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij);
15966ea7df73SStefano Zampini   /* TODO */
15972c71b3e2SJacob Faibussowitsch   PetscCheckFalse(!isaij && !ishyp && !isis,comm,PETSC_ERR_SUP,"Unsupported MatType %s! Supported types are %s, %s, %s, %s, %s, and %s",mtype,MATAIJ,MATSEQAIJ,MATSEQAIJMKL,MATMPIAIJ,MATIS,MATHYPRE);
1598978814f1SStefano Zampini   /* access ParCSRMatrix */
1599978814f1SStefano Zampini   rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr);
1600978814f1SStefano Zampini   rend   = hypre_ParCSRMatrixLastRowIndex(parcsr);
1601978814f1SStefano Zampini   cstart = hypre_ParCSRMatrixFirstColDiag(parcsr);
1602978814f1SStefano Zampini   cend   = hypre_ParCSRMatrixLastColDiag(parcsr);
1603978814f1SStefano Zampini   M      = hypre_ParCSRMatrixGlobalNumRows(parcsr);
1604978814f1SStefano Zampini   N      = hypre_ParCSRMatrixGlobalNumCols(parcsr);
1605978814f1SStefano Zampini 
1606fa92c42cSstefano_zampini   /* fix for empty local rows/columns */
1607fa92c42cSstefano_zampini   if (rend < rstart) rend = rstart;
1608fa92c42cSstefano_zampini   if (cend < cstart) cend = cstart;
1609fa92c42cSstefano_zampini 
1610e6471dc9SStefano Zampini   /* PETSc convention */
1611e6471dc9SStefano Zampini   rend++;
1612e6471dc9SStefano Zampini   cend++;
1613e6471dc9SStefano Zampini   rend = PetscMin(rend,M);
1614e6471dc9SStefano Zampini   cend = PetscMin(cend,N);
1615e6471dc9SStefano Zampini 
1616978814f1SStefano Zampini   /* create PETSc matrix with MatHYPRE */
16179566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm,&T));
16189566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(T,rend-rstart,cend-cstart,M,N));
16199566063dSJacob Faibussowitsch   PetscCall(MatSetType(T,MATHYPRE));
1620225daaf8SStefano Zampini   hA   = (Mat_HYPRE*)(T->data);
1621978814f1SStefano Zampini 
1622978814f1SStefano Zampini   /* create HYPRE_IJMatrix */
1623a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixCreate,hA->comm,rstart,rend-1,cstart,cend-1,&hA->ij);
1624a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR);
162545b8d346SStefano Zampini 
16266ea7df73SStefano Zampini // TODO DEV
162745b8d346SStefano Zampini   /* create new ParCSR object if needed */
162845b8d346SStefano Zampini   if (ishyp && copymode == PETSC_COPY_VALUES) {
162945b8d346SStefano Zampini     hypre_ParCSRMatrix *new_parcsr;
16306ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0)
163145b8d346SStefano Zampini     hypre_CSRMatrix    *hdiag,*hoffd,*ndiag,*noffd;
163245b8d346SStefano Zampini 
16330e6427aaSSatish Balay     new_parcsr = hypre_ParCSRMatrixClone(parcsr,0);
163445b8d346SStefano Zampini     hdiag      = hypre_ParCSRMatrixDiag(parcsr);
163545b8d346SStefano Zampini     hoffd      = hypre_ParCSRMatrixOffd(parcsr);
163645b8d346SStefano Zampini     ndiag      = hypre_ParCSRMatrixDiag(new_parcsr);
163745b8d346SStefano Zampini     noffd      = hypre_ParCSRMatrixOffd(new_parcsr);
16389566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hypre_CSRMatrixData(ndiag),hypre_CSRMatrixData(hdiag),hypre_CSRMatrixNumNonzeros(hdiag)));
16399566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hypre_CSRMatrixData(noffd),hypre_CSRMatrixData(hoffd),hypre_CSRMatrixNumNonzeros(hoffd)));
16406ea7df73SStefano Zampini #else
16416ea7df73SStefano Zampini     new_parcsr = hypre_ParCSRMatrixClone(parcsr,1);
16426ea7df73SStefano Zampini #endif
164345b8d346SStefano Zampini     parcsr     = new_parcsr;
164445b8d346SStefano Zampini     copymode   = PETSC_OWN_POINTER;
164545b8d346SStefano Zampini   }
1646978814f1SStefano Zampini 
1647978814f1SStefano Zampini   /* set ParCSR object */
1648978814f1SStefano Zampini   hypre_IJMatrixObject(hA->ij) = parcsr;
16494ec6421dSstefano_zampini   T->preallocated = PETSC_TRUE;
1650978814f1SStefano Zampini 
1651978814f1SStefano Zampini   /* set assembled flag */
1652978814f1SStefano Zampini   hypre_IJMatrixAssembleFlag(hA->ij) = 1;
16536ea7df73SStefano Zampini #if 0
1654a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixInitialize,hA->ij);
16556ea7df73SStefano Zampini #endif
1656225daaf8SStefano Zampini   if (ishyp) {
16576d2a658fSstefano_zampini     PetscMPIInt myid = 0;
16586d2a658fSstefano_zampini 
16596d2a658fSstefano_zampini     /* make sure we always have row_starts and col_starts available */
16606d2a658fSstefano_zampini     if (HYPRE_AssumedPartitionCheck()) {
16619566063dSJacob Faibussowitsch       PetscCallMPI(MPI_Comm_rank(comm,&myid));
16626d2a658fSstefano_zampini     }
1663a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
16646d2a658fSstefano_zampini     if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) {
16656d2a658fSstefano_zampini       PetscLayout map;
16666d2a658fSstefano_zampini 
16679566063dSJacob Faibussowitsch       PetscCall(MatGetLayouts(T,NULL,&map));
16689566063dSJacob Faibussowitsch       PetscCall(PetscLayoutSetUp(map));
16692cf14000SStefano Zampini       hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt*)(map->range + myid);
16706d2a658fSstefano_zampini     }
16716d2a658fSstefano_zampini     if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) {
16726d2a658fSstefano_zampini       PetscLayout map;
16736d2a658fSstefano_zampini 
16749566063dSJacob Faibussowitsch       PetscCall(MatGetLayouts(T,&map,NULL));
16759566063dSJacob Faibussowitsch       PetscCall(PetscLayoutSetUp(map));
16762cf14000SStefano Zampini       hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt*)(map->range + myid);
16776d2a658fSstefano_zampini     }
1678a1d2239cSSatish Balay #endif
1679978814f1SStefano Zampini     /* prevent from freeing the pointer */
1680978814f1SStefano Zampini     if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE;
1681225daaf8SStefano Zampini     *A   = T;
16829566063dSJacob Faibussowitsch     PetscCall(MatSetOption(*A,MAT_SORTED_FULL,PETSC_TRUE));
16839566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(*A,MAT_FINAL_ASSEMBLY));
16849566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(*A,MAT_FINAL_ASSEMBLY));
1685bb4689ddSStefano Zampini   } else if (isaij) {
1686bb4689ddSStefano Zampini     if (copymode != PETSC_OWN_POINTER) {
1687225daaf8SStefano Zampini       /* prevent from freeing the pointer */
1688225daaf8SStefano Zampini       hA->inner_free = PETSC_FALSE;
16899566063dSJacob Faibussowitsch       PetscCall(MatConvert_HYPRE_AIJ(T,MATAIJ,MAT_INITIAL_MATRIX,A));
16909566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&T));
1691225daaf8SStefano Zampini     } else { /* AIJ return type with PETSC_OWN_POINTER */
16929566063dSJacob Faibussowitsch       PetscCall(MatConvert_HYPRE_AIJ(T,MATAIJ,MAT_INPLACE_MATRIX,&T));
1693225daaf8SStefano Zampini       *A   = T;
1694225daaf8SStefano Zampini     }
1695bb4689ddSStefano Zampini   } else if (isis) {
16969566063dSJacob Faibussowitsch     PetscCall(MatConvert_HYPRE_IS(T,MATIS,MAT_INITIAL_MATRIX,A));
16978cfe8d00SStefano Zampini     if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE;
16989566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&T));
1699bb4689ddSStefano Zampini   }
1700978814f1SStefano Zampini   PetscFunctionReturn(0);
1701978814f1SStefano Zampini }
1702978814f1SStefano Zampini 
170368ec7858SStefano Zampini static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr)
1704dd9c0a25Sstefano_zampini {
1705dd9c0a25Sstefano_zampini   Mat_HYPRE *hA = (Mat_HYPRE*)A->data;
1706dd9c0a25Sstefano_zampini   HYPRE_Int type;
1707dd9c0a25Sstefano_zampini 
1708dd9c0a25Sstefano_zampini   PetscFunctionBegin;
170928b400f6SJacob Faibussowitsch   PetscCheck(hA->ij,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"HYPRE_IJMatrix not present");
1710a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hA->ij,&type);
17112c71b3e2SJacob Faibussowitsch   PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"HYPRE_IJMatrix is not of type HYPRE_PARCSR");
1712a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)parcsr);
1713dd9c0a25Sstefano_zampini   PetscFunctionReturn(0);
1714dd9c0a25Sstefano_zampini }
1715dd9c0a25Sstefano_zampini 
1716dd9c0a25Sstefano_zampini /*
1717dd9c0a25Sstefano_zampini    MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix
1718dd9c0a25Sstefano_zampini 
1719dd9c0a25Sstefano_zampini    Not collective
1720dd9c0a25Sstefano_zampini 
1721dd9c0a25Sstefano_zampini    Input Parameters:
1722dd9c0a25Sstefano_zampini +  A  - the MATHYPRE object
1723dd9c0a25Sstefano_zampini 
1724dd9c0a25Sstefano_zampini    Output Parameter:
1725dd9c0a25Sstefano_zampini .  parcsr  - the pointer to the hypre_ParCSRMatrix
1726dd9c0a25Sstefano_zampini 
1727dd9c0a25Sstefano_zampini    Level: intermediate
1728dd9c0a25Sstefano_zampini 
1729dd9c0a25Sstefano_zampini .seealso: MatHYPRE, PetscCopyMode
1730dd9c0a25Sstefano_zampini */
1731dd9c0a25Sstefano_zampini PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr)
1732dd9c0a25Sstefano_zampini {
1733dd9c0a25Sstefano_zampini   PetscFunctionBegin;
1734dd9c0a25Sstefano_zampini   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1735dd9c0a25Sstefano_zampini   PetscValidType(A,1);
1736*cac4c232SBarry Smith   PetscUseMethod(A,"MatHYPREGetParCSR_C",(Mat,hypre_ParCSRMatrix**),(A,parcsr));
1737dd9c0a25Sstefano_zampini   PetscFunctionReturn(0);
1738dd9c0a25Sstefano_zampini }
1739dd9c0a25Sstefano_zampini 
174068ec7858SStefano Zampini static PetscErrorCode MatMissingDiagonal_HYPRE(Mat A, PetscBool *missing, PetscInt *dd)
174168ec7858SStefano Zampini {
174268ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
174368ec7858SStefano Zampini   hypre_CSRMatrix    *ha;
174468ec7858SStefano Zampini   PetscInt           rst;
174568ec7858SStefano Zampini 
174668ec7858SStefano Zampini   PetscFunctionBegin;
17472c71b3e2SJacob Faibussowitsch   PetscCheckFalse(A->rmap->n != A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented with non-square diagonal blocks");
17489566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A,&rst,NULL));
17499566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
175068ec7858SStefano Zampini   if (missing) *missing = PETSC_FALSE;
175168ec7858SStefano Zampini   if (dd) *dd = -1;
175268ec7858SStefano Zampini   ha = hypre_ParCSRMatrixDiag(parcsr);
175368ec7858SStefano Zampini   if (ha) {
175468299464SStefano Zampini     PetscInt  size,i;
175568299464SStefano Zampini     HYPRE_Int *ii,*jj;
175668ec7858SStefano Zampini 
175768ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
175868ec7858SStefano Zampini     ii   = hypre_CSRMatrixI(ha);
175968ec7858SStefano Zampini     jj   = hypre_CSRMatrixJ(ha);
176068ec7858SStefano Zampini     for (i = 0; i < size; i++) {
176168ec7858SStefano Zampini       PetscInt  j;
176268ec7858SStefano Zampini       PetscBool found = PETSC_FALSE;
176368ec7858SStefano Zampini 
176468ec7858SStefano Zampini       for (j = ii[i]; j < ii[i+1] && !found; j++)
176568ec7858SStefano Zampini         found = (jj[j] == i) ? PETSC_TRUE : PETSC_FALSE;
176668ec7858SStefano Zampini 
176768ec7858SStefano Zampini       if (!found) {
17687d3de750SJacob Faibussowitsch         PetscInfo(A,"Matrix is missing local diagonal entry %" PetscInt_FMT "\n",i);
176968ec7858SStefano Zampini         if (missing) *missing = PETSC_TRUE;
177068ec7858SStefano Zampini         if (dd) *dd = i+rst;
177168ec7858SStefano Zampini         PetscFunctionReturn(0);
177268ec7858SStefano Zampini       }
177368ec7858SStefano Zampini     }
177468ec7858SStefano Zampini     if (!size) {
177568ec7858SStefano Zampini       PetscInfo(A,"Matrix has no diagonal entries therefore is missing diagonal\n");
177668ec7858SStefano Zampini       if (missing) *missing = PETSC_TRUE;
177768ec7858SStefano Zampini       if (dd) *dd = rst;
177868ec7858SStefano Zampini     }
177968ec7858SStefano Zampini   } else {
178068ec7858SStefano Zampini     PetscInfo(A,"Matrix has no diagonal entries therefore is missing diagonal\n");
178168ec7858SStefano Zampini     if (missing) *missing = PETSC_TRUE;
178268ec7858SStefano Zampini     if (dd) *dd = rst;
178368ec7858SStefano Zampini   }
178468ec7858SStefano Zampini   PetscFunctionReturn(0);
178568ec7858SStefano Zampini }
178668ec7858SStefano Zampini 
178768ec7858SStefano Zampini static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s)
178868ec7858SStefano Zampini {
178968ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
17906ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0)
179168ec7858SStefano Zampini   hypre_CSRMatrix    *ha;
17926ea7df73SStefano Zampini #endif
179339accc25SStefano Zampini   HYPRE_Complex      hs;
179468ec7858SStefano Zampini 
179568ec7858SStefano Zampini   PetscFunctionBegin;
17969566063dSJacob Faibussowitsch   PetscCall(PetscHYPREScalarCast(s,&hs));
17979566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
17986ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,19,0)
1799a74df02fSJacob Faibussowitsch   PetscStackCallStandard(hypre_ParCSRMatrixScale,parcsr,hs);
18006ea7df73SStefano Zampini #else  /* diagonal part */
180168ec7858SStefano Zampini   ha = hypre_ParCSRMatrixDiag(parcsr);
180268ec7858SStefano Zampini   if (ha) {
180368299464SStefano Zampini     PetscInt      size,i;
180468299464SStefano Zampini     HYPRE_Int     *ii;
180539accc25SStefano Zampini     HYPRE_Complex *a;
180668ec7858SStefano Zampini 
180768ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
180868ec7858SStefano Zampini     a    = hypre_CSRMatrixData(ha);
180968ec7858SStefano Zampini     ii   = hypre_CSRMatrixI(ha);
181039accc25SStefano Zampini     for (i = 0; i < ii[size]; i++) a[i] *= hs;
181168ec7858SStefano Zampini   }
181268ec7858SStefano Zampini   /* offdiagonal part */
181368ec7858SStefano Zampini   ha = hypre_ParCSRMatrixOffd(parcsr);
181468ec7858SStefano Zampini   if (ha) {
181568299464SStefano Zampini     PetscInt      size,i;
181668299464SStefano Zampini     HYPRE_Int     *ii;
181739accc25SStefano Zampini     HYPRE_Complex *a;
181868ec7858SStefano Zampini 
181968ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
182068ec7858SStefano Zampini     a    = hypre_CSRMatrixData(ha);
182168ec7858SStefano Zampini     ii   = hypre_CSRMatrixI(ha);
182239accc25SStefano Zampini     for (i = 0; i < ii[size]; i++) a[i] *= hs;
182368ec7858SStefano Zampini   }
18246ea7df73SStefano Zampini #endif
182568ec7858SStefano Zampini   PetscFunctionReturn(0);
182668ec7858SStefano Zampini }
182768ec7858SStefano Zampini 
182868ec7858SStefano Zampini static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
182968ec7858SStefano Zampini {
183068ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
183168299464SStefano Zampini   HYPRE_Int          *lrows;
183268299464SStefano Zampini   PetscInt           rst,ren,i;
183368ec7858SStefano Zampini 
183468ec7858SStefano Zampini   PetscFunctionBegin;
18352c71b3e2SJacob Faibussowitsch   PetscCheckFalse(x || b,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"To be implemented");
18369566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
18379566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(numRows,&lrows));
18389566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A,&rst,&ren));
183968ec7858SStefano Zampini   for (i=0;i<numRows;i++) {
184068ec7858SStefano Zampini     if (rows[i] < rst || rows[i] >= ren)
184168ec7858SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Non-local rows not yet supported");
184268ec7858SStefano Zampini     lrows[i] = rows[i] - rst;
184368ec7858SStefano Zampini   }
1844a74df02fSJacob Faibussowitsch   PetscStackCallStandard(hypre_ParCSRMatrixEliminateRowsCols,parcsr,numRows,lrows);
18459566063dSJacob Faibussowitsch   PetscCall(PetscFree(lrows));
184668ec7858SStefano Zampini   PetscFunctionReturn(0);
184768ec7858SStefano Zampini }
184868ec7858SStefano Zampini 
1849c69f721fSFande Kong static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha)
1850c69f721fSFande Kong {
1851c69f721fSFande Kong   PetscFunctionBegin;
1852c69f721fSFande Kong   if (ha) {
1853c69f721fSFande Kong     HYPRE_Int     *ii, size;
1854c69f721fSFande Kong     HYPRE_Complex *a;
1855c69f721fSFande Kong 
1856c69f721fSFande Kong     size = hypre_CSRMatrixNumRows(ha);
1857c69f721fSFande Kong     a    = hypre_CSRMatrixData(ha);
1858c69f721fSFande Kong     ii   = hypre_CSRMatrixI(ha);
1859c69f721fSFande Kong 
18609566063dSJacob Faibussowitsch     if (a) PetscCall(PetscArrayzero(a,ii[size]));
1861c69f721fSFande Kong   }
1862c69f721fSFande Kong   PetscFunctionReturn(0);
1863c69f721fSFande Kong }
1864c69f721fSFande Kong 
1865c69f721fSFande Kong PetscErrorCode MatZeroEntries_HYPRE(Mat A)
1866c69f721fSFande Kong {
18676ea7df73SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE*)A->data;
18686ea7df73SStefano Zampini 
18696ea7df73SStefano Zampini   PetscFunctionBegin;
18706ea7df73SStefano Zampini   if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) {
1871a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixSetConstantValues,hA->ij,0.0);
18726ea7df73SStefano Zampini   } else {
1873c69f721fSFande Kong     hypre_ParCSRMatrix *parcsr;
1874c69f721fSFande Kong 
18759566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
18769566063dSJacob Faibussowitsch     PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr)));
18779566063dSJacob Faibussowitsch     PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr)));
18786ea7df73SStefano Zampini   }
1879c69f721fSFande Kong   PetscFunctionReturn(0);
1880c69f721fSFande Kong }
1881c69f721fSFande Kong 
188239accc25SStefano Zampini static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA,PetscInt N,const PetscInt rows[],HYPRE_Complex diag)
1883c69f721fSFande Kong {
188439accc25SStefano Zampini   PetscInt        ii;
188539accc25SStefano Zampini   HYPRE_Int       *i, *j;
188639accc25SStefano Zampini   HYPRE_Complex   *a;
1887c69f721fSFande Kong 
1888c69f721fSFande Kong   PetscFunctionBegin;
1889c69f721fSFande Kong   if (!hA) PetscFunctionReturn(0);
1890c69f721fSFande Kong 
189139accc25SStefano Zampini   i = hypre_CSRMatrixI(hA);
189239accc25SStefano Zampini   j = hypre_CSRMatrixJ(hA);
1893c69f721fSFande Kong   a = hypre_CSRMatrixData(hA);
1894c69f721fSFande Kong 
1895c69f721fSFande Kong   for (ii = 0; ii < N; ii++) {
189639accc25SStefano Zampini     HYPRE_Int jj, ibeg, iend, irow;
189739accc25SStefano Zampini 
1898c69f721fSFande Kong     irow = rows[ii];
1899c69f721fSFande Kong     ibeg = i[irow];
1900c69f721fSFande Kong     iend = i[irow+1];
1901c69f721fSFande Kong     for (jj = ibeg; jj < iend; jj++)
1902c69f721fSFande Kong       if (j[jj] == irow) a[jj] = diag;
1903c69f721fSFande Kong       else a[jj] = 0.0;
1904c69f721fSFande Kong    }
1905c69f721fSFande Kong    PetscFunctionReturn(0);
1906c69f721fSFande Kong }
1907c69f721fSFande Kong 
1908ddbeb582SStefano Zampini static PetscErrorCode MatZeroRows_HYPRE(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b)
1909c69f721fSFande Kong {
1910c69f721fSFande Kong   hypre_ParCSRMatrix  *parcsr;
1911c69f721fSFande Kong   PetscInt            *lrows,len;
191239accc25SStefano Zampini   HYPRE_Complex       hdiag;
1913c69f721fSFande Kong 
1914c69f721fSFande Kong   PetscFunctionBegin;
19152c71b3e2SJacob Faibussowitsch   PetscCheckFalse(x || b,PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size");
19169566063dSJacob Faibussowitsch   PetscCall(PetscHYPREScalarCast(diag,&hdiag));
1917c69f721fSFande Kong   /* retrieve the internal matrix */
19189566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
1919c69f721fSFande Kong   /* get locally owned rows */
19209566063dSJacob Faibussowitsch   PetscCall(MatZeroRowsMapLocal_Private(A,N,rows,&len,&lrows));
1921c69f721fSFande Kong   /* zero diagonal part */
19229566063dSJacob Faibussowitsch   PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr),len,lrows,hdiag));
1923c69f721fSFande Kong   /* zero off-diagonal part */
19249566063dSJacob Faibussowitsch   PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr),len,lrows,0.0));
1925c69f721fSFande Kong 
19269566063dSJacob Faibussowitsch   PetscCall(PetscFree(lrows));
1927c69f721fSFande Kong   PetscFunctionReturn(0);
1928c69f721fSFande Kong }
1929c69f721fSFande Kong 
1930ddbeb582SStefano Zampini static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat,MatAssemblyType mode)
1931c69f721fSFande Kong {
1932c69f721fSFande Kong   PetscFunctionBegin;
1933c69f721fSFande Kong   if (mat->nooffprocentries) PetscFunctionReturn(0);
1934c69f721fSFande Kong 
19359566063dSJacob Faibussowitsch   PetscCall(MatStashScatterBegin_Private(mat,&mat->stash,mat->rmap->range));
1936c69f721fSFande Kong   PetscFunctionReturn(0);
1937c69f721fSFande Kong }
1938c69f721fSFande Kong 
1939ddbeb582SStefano Zampini static PetscErrorCode MatGetRow_HYPRE(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v)
1940c69f721fSFande Kong {
1941c69f721fSFande Kong   hypre_ParCSRMatrix  *parcsr;
19422cf14000SStefano Zampini   HYPRE_Int           hnz;
1943c69f721fSFande Kong 
1944c69f721fSFande Kong   PetscFunctionBegin;
1945c69f721fSFande Kong   /* retrieve the internal matrix */
19469566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
1947c69f721fSFande Kong   /* call HYPRE API */
1948a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_ParCSRMatrixGetRow,parcsr,row,&hnz,(HYPRE_BigInt**)idx,(HYPRE_Complex**)v);
19492cf14000SStefano Zampini   if (nz) *nz = (PetscInt)hnz;
1950c69f721fSFande Kong   PetscFunctionReturn(0);
1951c69f721fSFande Kong }
1952c69f721fSFande Kong 
1953ddbeb582SStefano Zampini static PetscErrorCode MatRestoreRow_HYPRE(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v)
1954c69f721fSFande Kong {
1955c69f721fSFande Kong   hypre_ParCSRMatrix  *parcsr;
19562cf14000SStefano Zampini   HYPRE_Int           hnz;
1957c69f721fSFande Kong 
1958c69f721fSFande Kong   PetscFunctionBegin;
1959c69f721fSFande Kong   /* retrieve the internal matrix */
19609566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
1961c69f721fSFande Kong   /* call HYPRE API */
19622cf14000SStefano Zampini   hnz = nz ? (HYPRE_Int)(*nz) : 0;
1963a74df02fSJacob Faibussowitsch   PetscStackCallStandard(HYPRE_ParCSRMatrixRestoreRow,parcsr,row,&hnz,(HYPRE_BigInt**)idx,(HYPRE_Complex**)v);
1964c69f721fSFande Kong   PetscFunctionReturn(0);
1965c69f721fSFande Kong }
1966c69f721fSFande Kong 
1967ddbeb582SStefano Zampini static PetscErrorCode MatGetValues_HYPRE(Mat A,PetscInt m,const PetscInt idxm[],PetscInt n,const PetscInt idxn[],PetscScalar v[])
1968c69f721fSFande Kong {
196945b8d346SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE*)A->data;
1970c69f721fSFande Kong   PetscInt  i;
19711d4906efSStefano Zampini 
1972c69f721fSFande Kong   PetscFunctionBegin;
1973c69f721fSFande Kong   if (!m || !n) PetscFunctionReturn(0);
1974c69f721fSFande Kong   /* Ignore negative row indices
1975c69f721fSFande Kong    * And negative column indices should be automatically ignored in hypre
1976c69f721fSFande Kong    * */
19772cf14000SStefano Zampini   for (i=0; i<m; i++) {
19782cf14000SStefano Zampini     if (idxm[i] >= 0) {
19792cf14000SStefano Zampini       HYPRE_Int hn = (HYPRE_Int)n;
1980a74df02fSJacob Faibussowitsch       PetscStackCallStandard(HYPRE_IJMatrixGetValues,hA->ij,1,&hn,(HYPRE_BigInt*)&idxm[i],(HYPRE_BigInt*)idxn,(HYPRE_Complex*)(v + i*n));
19812cf14000SStefano Zampini     }
19822cf14000SStefano Zampini   }
1983c69f721fSFande Kong   PetscFunctionReturn(0);
1984c69f721fSFande Kong }
1985c69f721fSFande Kong 
1986ddbeb582SStefano Zampini static PetscErrorCode MatSetOption_HYPRE(Mat A,MatOption op,PetscBool flg)
1987ddbeb582SStefano Zampini {
1988ddbeb582SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE*)A->data;
1989ddbeb582SStefano Zampini 
1990ddbeb582SStefano Zampini   PetscFunctionBegin;
1991c6698e78SStefano Zampini   switch (op) {
1992ddbeb582SStefano Zampini   case MAT_NO_OFF_PROC_ENTRIES:
1993ddbeb582SStefano Zampini     if (flg) {
1994a74df02fSJacob Faibussowitsch       PetscStackCallStandard(HYPRE_IJMatrixSetMaxOffProcElmts,hA->ij,0);
1995ddbeb582SStefano Zampini     }
1996ddbeb582SStefano Zampini     break;
1997336664bdSPierre Jolivet   case MAT_SORTED_FULL:
1998336664bdSPierre Jolivet     hA->sorted_full = flg;
1999336664bdSPierre Jolivet     break;
2000ddbeb582SStefano Zampini   default:
2001ddbeb582SStefano Zampini     break;
2002ddbeb582SStefano Zampini   }
2003ddbeb582SStefano Zampini   PetscFunctionReturn(0);
2004ddbeb582SStefano Zampini }
2005c69f721fSFande Kong 
200645b8d346SStefano Zampini static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view)
200745b8d346SStefano Zampini {
200845b8d346SStefano Zampini   PetscViewerFormat  format;
200945b8d346SStefano Zampini 
201045b8d346SStefano Zampini   PetscFunctionBegin;
20119566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(view,&format));
20126ea7df73SStefano Zampini   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0);
201345b8d346SStefano Zampini   if (format != PETSC_VIEWER_NATIVE) {
20146ea7df73SStefano Zampini     Mat                B;
20156ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
20166ea7df73SStefano Zampini     PetscErrorCode     (*mview)(Mat,PetscViewer) = NULL;
20176ea7df73SStefano Zampini 
20189566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
20199566063dSJacob Faibussowitsch     PetscCall(MatCreateFromParCSR(parcsr,MATAIJ,PETSC_USE_POINTER,&B));
20209566063dSJacob Faibussowitsch     PetscCall(MatGetOperation(B,MATOP_VIEW,(void(**)(void))&mview));
202128b400f6SJacob Faibussowitsch     PetscCheck(mview,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing view operation");
20229566063dSJacob Faibussowitsch     PetscCall((*mview)(B,view));
20239566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&B));
202445b8d346SStefano Zampini   } else {
202545b8d346SStefano Zampini     Mat_HYPRE  *hA = (Mat_HYPRE*)A->data;
202645b8d346SStefano Zampini     PetscMPIInt size;
202745b8d346SStefano Zampini     PetscBool   isascii;
202845b8d346SStefano Zampini     const char *filename;
202945b8d346SStefano Zampini 
203045b8d346SStefano Zampini     /* HYPRE uses only text files */
20319566063dSJacob Faibussowitsch     PetscCall(PetscObjectTypeCompare((PetscObject)view,PETSCVIEWERASCII,&isascii));
203228b400f6SJacob Faibussowitsch     PetscCheck(isascii,PetscObjectComm((PetscObject)view),PETSC_ERR_SUP,"PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII",((PetscObject)view)->type_name);
20339566063dSJacob Faibussowitsch     PetscCall(PetscViewerFileGetName(view,&filename));
2034a74df02fSJacob Faibussowitsch     PetscStackCallStandard(HYPRE_IJMatrixPrint,hA->ij,filename);
20359566063dSJacob Faibussowitsch     PetscCallMPI(MPI_Comm_size(hA->comm,&size));
203645b8d346SStefano Zampini     if (size > 1) {
20379566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(view,"Matrix files: %s.%05d ... %s.%05d\n",filename,0,filename,size-1));
203845b8d346SStefano Zampini     } else {
20399566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(view,"Matrix file: %s.%05d\n",filename,0));
204045b8d346SStefano Zampini     }
204145b8d346SStefano Zampini   }
204245b8d346SStefano Zampini   PetscFunctionReturn(0);
204345b8d346SStefano Zampini }
204445b8d346SStefano Zampini 
204545b8d346SStefano Zampini static PetscErrorCode MatDuplicate_HYPRE(Mat A,MatDuplicateOption op, Mat *B)
204645b8d346SStefano Zampini {
20476abb4441SStefano Zampini   hypre_ParCSRMatrix *parcsr = NULL;
204845b8d346SStefano Zampini   PetscCopyMode      cpmode;
204945b8d346SStefano Zampini 
205045b8d346SStefano Zampini   PetscFunctionBegin;
20519566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
205245b8d346SStefano Zampini   if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) {
20530e6427aaSSatish Balay     parcsr = hypre_ParCSRMatrixClone(parcsr,0);
205445b8d346SStefano Zampini     cpmode = PETSC_OWN_POINTER;
205545b8d346SStefano Zampini   } else {
205645b8d346SStefano Zampini     cpmode = PETSC_COPY_VALUES;
205745b8d346SStefano Zampini   }
20589566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(parcsr,MATHYPRE,cpmode,B));
205945b8d346SStefano Zampini   PetscFunctionReturn(0);
206045b8d346SStefano Zampini }
206145b8d346SStefano Zampini 
2062465edc17SStefano Zampini static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str)
2063465edc17SStefano Zampini {
2064465edc17SStefano Zampini   hypre_ParCSRMatrix *acsr,*bcsr;
2065465edc17SStefano Zampini 
2066465edc17SStefano Zampini   PetscFunctionBegin;
2067465edc17SStefano Zampini   if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) {
20689566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A,&acsr));
20699566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(B,&bcsr));
2070a74df02fSJacob Faibussowitsch     PetscStackCallStandard(hypre_ParCSRMatrixCopy,acsr,bcsr,1);
20719566063dSJacob Faibussowitsch     PetscCall(MatSetOption(B,MAT_SORTED_FULL,PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */
20729566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY));
20739566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY));
2074465edc17SStefano Zampini   } else {
20759566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A,B,str));
2076465edc17SStefano Zampini   }
2077465edc17SStefano Zampini   PetscFunctionReturn(0);
2078465edc17SStefano Zampini }
2079465edc17SStefano Zampini 
20806305df00SStefano Zampini static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d)
20816305df00SStefano Zampini {
20826305df00SStefano Zampini   hypre_ParCSRMatrix *parcsr;
20836305df00SStefano Zampini   hypre_CSRMatrix    *dmat;
208439accc25SStefano Zampini   HYPRE_Complex      *a;
208539accc25SStefano Zampini   HYPRE_Complex      *data = NULL;
20862cf14000SStefano Zampini   HYPRE_Int          *diag = NULL;
20872cf14000SStefano Zampini   PetscInt           i;
20886305df00SStefano Zampini   PetscBool          cong;
20896305df00SStefano Zampini 
20906305df00SStefano Zampini   PetscFunctionBegin;
20919566063dSJacob Faibussowitsch   PetscCall(MatHasCongruentLayouts(A,&cong));
209228b400f6SJacob Faibussowitsch   PetscCheck(cong,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only for square matrices with same local distributions of rows and columns");
209376bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
20946305df00SStefano Zampini     PetscBool miss;
20959566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal(A,&miss,NULL));
20962c71b3e2SJacob Faibussowitsch     PetscCheckFalse(miss && A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented when diagonal entries are missing");
20976305df00SStefano Zampini   }
20989566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr));
20996305df00SStefano Zampini   dmat = hypre_ParCSRMatrixDiag(parcsr);
21006305df00SStefano Zampini   if (dmat) {
210139accc25SStefano Zampini     /* this cast fixes the clang error: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */
21029566063dSJacob Faibussowitsch     PetscCall(VecGetArray(d,(PetscScalar**)&a));
21032cf14000SStefano Zampini     diag = hypre_CSRMatrixI(dmat);
210439accc25SStefano Zampini     data = hypre_CSRMatrixData(dmat);
21056305df00SStefano Zampini     for (i=0;i<A->rmap->n;i++) a[i] = data[diag[i]];
21069566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(d,(PetscScalar**)&a));
21076305df00SStefano Zampini   }
21086305df00SStefano Zampini   PetscFunctionReturn(0);
21096305df00SStefano Zampini }
21106305df00SStefano Zampini 
2111363d496dSStefano Zampini #include <petscblaslapack.h>
2112363d496dSStefano Zampini 
2113363d496dSStefano Zampini static PetscErrorCode MatAXPY_HYPRE(Mat Y,PetscScalar a,Mat X,MatStructure str)
2114363d496dSStefano Zampini {
2115363d496dSStefano Zampini   PetscFunctionBegin;
21166ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
21176ea7df73SStefano Zampini   {
21186ea7df73SStefano Zampini     Mat                B;
21196ea7df73SStefano Zampini     hypre_ParCSRMatrix *x,*y,*z;
21206ea7df73SStefano Zampini 
21219566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(Y,&y));
21229566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(X,&x));
2123a74df02fSJacob Faibussowitsch     PetscStackCallStandard(hypre_ParCSRMatrixAdd,1.0,y,1.0,x,&z);
21249566063dSJacob Faibussowitsch     PetscCall(MatCreateFromParCSR(z,MATHYPRE,PETSC_OWN_POINTER,&B));
21259566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y,&B));
21266ea7df73SStefano Zampini   }
21276ea7df73SStefano Zampini #else
2128363d496dSStefano Zampini   if (str == SAME_NONZERO_PATTERN) {
2129363d496dSStefano Zampini     hypre_ParCSRMatrix *x,*y;
2130363d496dSStefano Zampini     hypre_CSRMatrix    *xloc,*yloc;
2131363d496dSStefano Zampini     PetscInt           xnnz,ynnz;
213239accc25SStefano Zampini     HYPRE_Complex      *xarr,*yarr;
2133363d496dSStefano Zampini     PetscBLASInt       one=1,bnz;
2134363d496dSStefano Zampini 
21359566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(Y,&y));
21369566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(X,&x));
2137363d496dSStefano Zampini 
2138363d496dSStefano Zampini     /* diagonal block */
2139363d496dSStefano Zampini     xloc = hypre_ParCSRMatrixDiag(x);
2140363d496dSStefano Zampini     yloc = hypre_ParCSRMatrixDiag(y);
2141363d496dSStefano Zampini     xnnz = 0;
2142363d496dSStefano Zampini     ynnz = 0;
2143363d496dSStefano Zampini     xarr = NULL;
2144363d496dSStefano Zampini     yarr = NULL;
2145363d496dSStefano Zampini     if (xloc) {
214639accc25SStefano Zampini       xarr = hypre_CSRMatrixData(xloc);
2147363d496dSStefano Zampini       xnnz = hypre_CSRMatrixNumNonzeros(xloc);
2148363d496dSStefano Zampini     }
2149363d496dSStefano Zampini     if (yloc) {
215039accc25SStefano Zampini       yarr = hypre_CSRMatrixData(yloc);
2151363d496dSStefano Zampini       ynnz = hypre_CSRMatrixNumNonzeros(yloc);
2152363d496dSStefano Zampini     }
21532c71b3e2SJacob Faibussowitsch     PetscCheckFalse(xnnz != ynnz,PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT,xnnz,ynnz);
21549566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(xnnz,&bnz));
215539accc25SStefano Zampini     PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&a,(PetscScalar*)xarr,&one,(PetscScalar*)yarr,&one));
2156363d496dSStefano Zampini 
2157363d496dSStefano Zampini     /* off-diagonal block */
2158363d496dSStefano Zampini     xloc = hypre_ParCSRMatrixOffd(x);
2159363d496dSStefano Zampini     yloc = hypre_ParCSRMatrixOffd(y);
2160363d496dSStefano Zampini     xnnz = 0;
2161363d496dSStefano Zampini     ynnz = 0;
2162363d496dSStefano Zampini     xarr = NULL;
2163363d496dSStefano Zampini     yarr = NULL;
2164363d496dSStefano Zampini     if (xloc) {
216539accc25SStefano Zampini       xarr = hypre_CSRMatrixData(xloc);
2166363d496dSStefano Zampini       xnnz = hypre_CSRMatrixNumNonzeros(xloc);
2167363d496dSStefano Zampini     }
2168363d496dSStefano Zampini     if (yloc) {
216939accc25SStefano Zampini       yarr = hypre_CSRMatrixData(yloc);
2170363d496dSStefano Zampini       ynnz = hypre_CSRMatrixNumNonzeros(yloc);
2171363d496dSStefano Zampini     }
21722c71b3e2SJacob Faibussowitsch     PetscCheckFalse(xnnz != ynnz,PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT,xnnz,ynnz);
21739566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(xnnz,&bnz));
217439accc25SStefano Zampini     PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&a,(PetscScalar*)xarr,&one,(PetscScalar*)yarr,&one));
2175363d496dSStefano Zampini   } else if (str == SUBSET_NONZERO_PATTERN) {
21769566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y,a,X,str));
2177363d496dSStefano Zampini   } else {
2178363d496dSStefano Zampini     Mat B;
2179363d496dSStefano Zampini 
21809566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic_Preallocate(Y,X,&B));
21819566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B,Y,a,X,str));
21829566063dSJacob Faibussowitsch     PetscCall(MatHeaderReplace(Y,&B));
2183363d496dSStefano Zampini   }
21846ea7df73SStefano Zampini #endif
2185363d496dSStefano Zampini   PetscFunctionReturn(0);
2186363d496dSStefano Zampini }
2187363d496dSStefano Zampini 
21885fbaff96SJunchao Zhang static PetscErrorCode MatSetPreallocationCOO_HYPRE(Mat mat, PetscCount coo_n, const PetscInt coo_i[], const PetscInt coo_j[])
21895fbaff96SJunchao Zhang {
21905fbaff96SJunchao Zhang   MPI_Comm               comm;
21915fbaff96SJunchao Zhang   PetscMPIInt            size;
21925fbaff96SJunchao Zhang   PetscLayout            rmap,cmap;
21935fbaff96SJunchao Zhang   Mat_HYPRE              *hmat;
21945fbaff96SJunchao Zhang   hypre_ParCSRMatrix     *parCSR;
21955fbaff96SJunchao Zhang   hypre_CSRMatrix        *diag,*offd;
21965fbaff96SJunchao Zhang   Mat                    A,B,cooMat;
21975fbaff96SJunchao Zhang   PetscScalar            *Aa,*Ba;
21985fbaff96SJunchao Zhang   HYPRE_MemoryLocation   hypreMemtype = HYPRE_MEMORY_HOST;
21995fbaff96SJunchao Zhang   PetscMemType           petscMemtype;
22005fbaff96SJunchao Zhang   MatType                matType = MATAIJ; /* default type of cooMat */
22015fbaff96SJunchao Zhang 
22025fbaff96SJunchao Zhang   PetscFunctionBegin;
22035fbaff96SJunchao Zhang   /* Build an agent matrix cooMat whose type is either MATAIJ or MATAIJKOKKOS.
22045fbaff96SJunchao Zhang      It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work.
22055fbaff96SJunchao Zhang    */
22065fbaff96SJunchao Zhang   PetscCall(PetscObjectGetComm((PetscObject)mat,&comm));
22075fbaff96SJunchao Zhang   PetscCallMPI(MPI_Comm_size(comm,&size));
22085fbaff96SJunchao Zhang   PetscCall(PetscLayoutSetUp(mat->rmap));
22095fbaff96SJunchao Zhang   PetscCall(PetscLayoutSetUp(mat->cmap));
22105fbaff96SJunchao Zhang   PetscCall(MatGetLayouts(mat,&rmap,&cmap));
22115fbaff96SJunchao Zhang 
22125fbaff96SJunchao Zhang   /* I do not know how hypre_ParCSRMatrix stores diagonal elements for non-square matrices, so I just give up now */
22135fbaff96SJunchao Zhang   PetscCheck(rmap->N == cmap->N,comm,PETSC_ERR_SUP,"MATHYPRE COO cannot handle non-square matrices");
22145fbaff96SJunchao Zhang 
22155fbaff96SJunchao Zhang  #if defined(PETSC_HAVE_DEVICE)
22165fbaff96SJunchao Zhang   if (!mat->boundtocpu) { /* mat will be on device, so will cooMat */
22175fbaff96SJunchao Zhang    #if defined(PETSC_HAVE_KOKKOS)
22185fbaff96SJunchao Zhang     matType = MATAIJKOKKOS;
22195fbaff96SJunchao Zhang    #else
22205fbaff96SJunchao Zhang     SETERRQ(comm,PETSC_ERR_SUP,"To support MATHYPRE COO assembly on device, we need Kokkos, e.g., --download-kokkos --download-kokkos-kernels");
22215fbaff96SJunchao Zhang    #endif
22225fbaff96SJunchao Zhang   }
22235fbaff96SJunchao Zhang  #endif
22245fbaff96SJunchao Zhang 
22255fbaff96SJunchao Zhang   /* Do COO preallocation through cooMat */
22265fbaff96SJunchao Zhang   hmat = (Mat_HYPRE*)mat->data;
22275fbaff96SJunchao Zhang   PetscCall(MatDestroy(&hmat->cooMat));
22285fbaff96SJunchao Zhang   PetscCall(MatCreate(comm,&cooMat));
22295fbaff96SJunchao Zhang   PetscCall(MatSetType(cooMat,matType));
22305fbaff96SJunchao Zhang   PetscCall(MatSetLayouts(cooMat,rmap,cmap));
22315fbaff96SJunchao Zhang   PetscCall(MatSetPreallocationCOO(cooMat,coo_n,coo_i,coo_j));
22325fbaff96SJunchao Zhang 
22335fbaff96SJunchao Zhang   /* Copy the sparsity pattern from cooMat to hypre IJMatrix hmat->ij */
22345fbaff96SJunchao Zhang   PetscCall(MatSetOption(mat,MAT_SORTED_FULL,PETSC_TRUE));
22355fbaff96SJunchao Zhang   PetscCall(MatSetOption(mat,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE));
22365fbaff96SJunchao Zhang   PetscCall(MatHYPRE_CreateFromMat(cooMat,hmat)); /* Create hmat->ij and preallocate it */
22375fbaff96SJunchao Zhang   PetscCall(MatHYPRE_IJMatrixCopy(cooMat,hmat->ij)); /* Copy A's (a,i,j) to hmat->ij. To reuse code. Copying 'a' is not really needed */
22385fbaff96SJunchao Zhang 
22395fbaff96SJunchao Zhang   mat->preallocated = PETSC_TRUE;
22405fbaff96SJunchao Zhang   PetscCall(MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY));
22415fbaff96SJunchao Zhang   PetscCall(MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY)); /* Migrate mat to device if it is bound to. Hypre builds its own SpMV context here */
22425fbaff96SJunchao Zhang 
22435fbaff96SJunchao Zhang   /* Alias cooMat's data array to IJMatrix's */
22445fbaff96SJunchao Zhang   PetscStackCallStandard(HYPRE_IJMatrixGetObject,hmat->ij,(void**)&parCSR);
22455fbaff96SJunchao Zhang   diag = hypre_ParCSRMatrixDiag(parCSR);
22465fbaff96SJunchao Zhang   offd = hypre_ParCSRMatrixOffd(parCSR);
22475fbaff96SJunchao Zhang 
22485fbaff96SJunchao Zhang   hypreMemtype = hypre_CSRMatrixMemoryLocation(diag);
22495fbaff96SJunchao Zhang   A    = (size == 1)? cooMat : ((Mat_MPIAIJ*)cooMat->data)->A;
22505fbaff96SJunchao Zhang   PetscCall(MatSeqAIJGetCSRAndMemType(A,NULL,NULL,&Aa,&petscMemtype));
22515fbaff96SJunchao Zhang   PetscAssert((PetscMemTypeHost(petscMemtype) && hypreMemtype == HYPRE_MEMORY_HOST) ||
22525fbaff96SJunchao Zhang               (PetscMemTypeDevice(petscMemtype) && hypreMemtype == HYPRE_MEMORY_DEVICE),
22535fbaff96SJunchao Zhang               comm,PETSC_ERR_PLIB,"PETSc and hypre's memory types mismatch");
22545fbaff96SJunchao Zhang 
22555fbaff96SJunchao Zhang   hmat->diagJ = hypre_CSRMatrixJ(diag);
22565fbaff96SJunchao Zhang   PetscStackCall("hypre_TFree",hypre_TFree(hypre_CSRMatrixData(diag),hypreMemtype));
22575fbaff96SJunchao Zhang   hypre_CSRMatrixData(diag)     = (HYPRE_Complex*)Aa;
22585fbaff96SJunchao Zhang   hypre_CSRMatrixOwnsData(diag) = 0; /* Take ownership of (j,a) away from hypre. As a result, we need to free them on our own */
22595fbaff96SJunchao Zhang 
22605fbaff96SJunchao Zhang   /* Copy diagonal pointers of A to device to facilitate MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos */
22615fbaff96SJunchao Zhang   if (hypreMemtype == HYPRE_MEMORY_DEVICE) {
22625fbaff96SJunchao Zhang     PetscStackCall("hypre_TAlloc",hmat->diag = hypre_TAlloc(PetscInt,rmap->n,hypreMemtype));
22635fbaff96SJunchao Zhang     PetscCall(MatMarkDiagonal_SeqAIJ(A)); /* We need updated diagonal positions */
22645fbaff96SJunchao Zhang     PetscStackCall("hypre_TMemcpy",hypre_TMemcpy(hmat->diag,((Mat_SeqAIJ*)A->data)->diag,PetscInt,rmap->n,hypreMemtype,HYPRE_MEMORY_HOST));
22655fbaff96SJunchao Zhang   }
22665fbaff96SJunchao Zhang 
22675fbaff96SJunchao Zhang   if (size > 1) {
22685fbaff96SJunchao Zhang     B    = ((Mat_MPIAIJ*)cooMat->data)->B;
22695fbaff96SJunchao Zhang     PetscCall(MatSeqAIJGetCSRAndMemType(B,NULL,NULL,&Ba,&petscMemtype));
22705fbaff96SJunchao Zhang     hmat->offdJ = hypre_CSRMatrixJ(offd);
22715fbaff96SJunchao Zhang     PetscStackCall("hypre_TFree",hypre_TFree(hypre_CSRMatrixData(offd),hypreMemtype));
22725fbaff96SJunchao Zhang     hypre_CSRMatrixData(offd)     = (HYPRE_Complex*)Ba;
22735fbaff96SJunchao Zhang     hypre_CSRMatrixOwnsData(offd) = 0;
22745fbaff96SJunchao Zhang   }
22755fbaff96SJunchao Zhang 
22765fbaff96SJunchao Zhang   /* Record cooMat for use in MatSetValuesCOO_HYPRE */
22775fbaff96SJunchao Zhang   hmat->cooMat  = cooMat;
22785fbaff96SJunchao Zhang   hmat->memType = hypreMemtype;
22795fbaff96SJunchao Zhang   PetscFunctionReturn(0);
22805fbaff96SJunchao Zhang }
22815fbaff96SJunchao Zhang 
22825fbaff96SJunchao Zhang static PetscErrorCode MatSetValuesCOO_HYPRE(Mat mat, const PetscScalar v[], InsertMode imode)
22835fbaff96SJunchao Zhang {
22845fbaff96SJunchao Zhang   Mat_HYPRE      *hmat = (Mat_HYPRE*)mat->data;
22855fbaff96SJunchao Zhang   PetscMPIInt    size;
22865fbaff96SJunchao Zhang   Mat            A;
22875fbaff96SJunchao Zhang 
22885fbaff96SJunchao Zhang   PetscFunctionBegin;
22895fbaff96SJunchao Zhang   PetscCheck(hmat->cooMat,hmat->comm,PETSC_ERR_PLIB,"HYPRE COO delegate matrix has not been created yet");
22905fbaff96SJunchao Zhang   PetscCallMPI(MPI_Comm_size(hmat->comm,&size));
22915fbaff96SJunchao Zhang   PetscCall(MatSetValuesCOO(hmat->cooMat,v,imode));
22925fbaff96SJunchao Zhang 
22935fbaff96SJunchao Zhang   /* Move diagonal elements of the diagonal block to the front of their row, as needed by ParCSRMatrix. So damn hacky */
22945fbaff96SJunchao Zhang   A = (size == 1) ? hmat->cooMat : ((Mat_MPIAIJ*)hmat->cooMat->data)->A;
22955fbaff96SJunchao Zhang   if (hmat->memType == HYPRE_MEMORY_HOST) {
22965fbaff96SJunchao Zhang     Mat_SeqAIJ   *aij = (Mat_SeqAIJ*)A->data;
22975fbaff96SJunchao Zhang     PetscInt     i,m,*Ai = aij->i,*Adiag = aij->diag;
22985fbaff96SJunchao Zhang     PetscScalar  *Aa = aij->a,tmp;
22995fbaff96SJunchao Zhang 
23005fbaff96SJunchao Zhang     PetscCall(MatGetSize(A,&m,NULL));
23015fbaff96SJunchao Zhang     for (i=0; i<m; i++) {
23025fbaff96SJunchao Zhang       if (Adiag[i] >= Ai[i] && Adiag[i] < Ai[i+1]) { /* Digonal element of this row exists in a[] and j[] */
23035fbaff96SJunchao Zhang         tmp          = Aa[Ai[i]];
23045fbaff96SJunchao Zhang         Aa[Ai[i]]    = Aa[Adiag[i]];
23055fbaff96SJunchao Zhang         Aa[Adiag[i]] = tmp;
23065fbaff96SJunchao Zhang       }
23075fbaff96SJunchao Zhang     }
23085fbaff96SJunchao Zhang   } else {
23095fbaff96SJunchao Zhang    #if defined(PETSC_HAVE_KOKKOS_KERNELS)
23105fbaff96SJunchao Zhang     PetscCall(MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos(A,hmat->diag));
23115fbaff96SJunchao Zhang    #endif
23125fbaff96SJunchao Zhang   }
23135fbaff96SJunchao Zhang   PetscFunctionReturn(0);
23145fbaff96SJunchao Zhang }
23155fbaff96SJunchao Zhang 
2316a055b5aaSBarry Smith /*MC
2317a055b5aaSBarry Smith    MATHYPRE - MATHYPRE = "hypre" - A matrix type to be used for sequential and parallel sparse matrices
2318a055b5aaSBarry Smith           based on the hypre IJ interface.
2319a055b5aaSBarry Smith 
2320a055b5aaSBarry Smith    Level: intermediate
2321a055b5aaSBarry Smith 
2322a055b5aaSBarry Smith .seealso: MatCreate()
2323a055b5aaSBarry Smith M*/
2324a055b5aaSBarry Smith 
232563c07aadSStefano Zampini PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B)
232663c07aadSStefano Zampini {
232763c07aadSStefano Zampini   Mat_HYPRE      *hB;
232863c07aadSStefano Zampini 
232963c07aadSStefano Zampini   PetscFunctionBegin;
23309566063dSJacob Faibussowitsch   PetscCall(PetscNewLog(B,&hB));
23316ea7df73SStefano Zampini 
2332978814f1SStefano Zampini   hB->inner_free  = PETSC_TRUE;
2333c69f721fSFande Kong   hB->available   = PETSC_TRUE;
2334336664bdSPierre Jolivet   hB->sorted_full = PETSC_FALSE; /* no assumption whether column indices are sorted or not */
2335c69f721fSFande Kong   hB->size        = 0;
2336c69f721fSFande Kong   hB->array       = NULL;
2337978814f1SStefano Zampini 
233863c07aadSStefano Zampini   B->data       = (void*)hB;
233963c07aadSStefano Zampini   B->assembled  = PETSC_FALSE;
234063c07aadSStefano Zampini 
23419566063dSJacob Faibussowitsch   PetscCall(PetscMemzero(B->ops,sizeof(struct _MatOps)));
234263c07aadSStefano Zampini   B->ops->mult                  = MatMult_HYPRE;
234363c07aadSStefano Zampini   B->ops->multtranspose         = MatMultTranspose_HYPRE;
2344414bd5c3SStefano Zampini   B->ops->multadd               = MatMultAdd_HYPRE;
2345414bd5c3SStefano Zampini   B->ops->multtransposeadd      = MatMultTransposeAdd_HYPRE;
234663c07aadSStefano Zampini   B->ops->setup                 = MatSetUp_HYPRE;
234763c07aadSStefano Zampini   B->ops->destroy               = MatDestroy_HYPRE;
234863c07aadSStefano Zampini   B->ops->assemblyend           = MatAssemblyEnd_HYPRE;
2349c69f721fSFande Kong   B->ops->assemblybegin         = MatAssemblyBegin_HYPRE;
2350d975228cSstefano_zampini   B->ops->setvalues             = MatSetValues_HYPRE;
235168ec7858SStefano Zampini   B->ops->missingdiagonal       = MatMissingDiagonal_HYPRE;
235268ec7858SStefano Zampini   B->ops->scale                 = MatScale_HYPRE;
235368ec7858SStefano Zampini   B->ops->zerorowscolumns       = MatZeroRowsColumns_HYPRE;
2354c69f721fSFande Kong   B->ops->zeroentries           = MatZeroEntries_HYPRE;
2355c69f721fSFande Kong   B->ops->zerorows              = MatZeroRows_HYPRE;
2356c69f721fSFande Kong   B->ops->getrow                = MatGetRow_HYPRE;
2357c69f721fSFande Kong   B->ops->restorerow            = MatRestoreRow_HYPRE;
2358c69f721fSFande Kong   B->ops->getvalues             = MatGetValues_HYPRE;
2359ddbeb582SStefano Zampini   B->ops->setoption             = MatSetOption_HYPRE;
236045b8d346SStefano Zampini   B->ops->duplicate             = MatDuplicate_HYPRE;
2361465edc17SStefano Zampini   B->ops->copy                  = MatCopy_HYPRE;
236245b8d346SStefano Zampini   B->ops->view                  = MatView_HYPRE;
23636305df00SStefano Zampini   B->ops->getdiagonal           = MatGetDiagonal_HYPRE;
2364363d496dSStefano Zampini   B->ops->axpy                  = MatAXPY_HYPRE;
23654222ddf1SHong Zhang   B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE;
23666ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
23676ea7df73SStefano Zampini   B->ops->bindtocpu             = MatBindToCPU_HYPRE;
23686ea7df73SStefano Zampini   B->boundtocpu                 = PETSC_FALSE;
23696ea7df73SStefano Zampini #endif
237045b8d346SStefano Zampini 
237145b8d346SStefano Zampini   /* build cache for off array entries formed */
23729566063dSJacob Faibussowitsch   PetscCall(MatStashCreate_Private(PetscObjectComm((PetscObject)B),1,&B->stash));
237363c07aadSStefano Zampini 
23749566063dSJacob Faibussowitsch   PetscCall(PetscCommGetComm(PetscObjectComm((PetscObject)B),&hB->comm));
23759566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATHYPRE));
23769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_hypre_aij_C",MatConvert_HYPRE_AIJ));
23779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_hypre_is_C",MatConvert_HYPRE_IS));
23789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_hypre_C",MatProductSetFromOptions_HYPRE));
23799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_mpiaij_hypre_C",MatProductSetFromOptions_HYPRE));
23809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatHYPRESetPreallocation_C",MatHYPRESetPreallocation_HYPRE));
23819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatHYPREGetParCSR_C",MatHYPREGetParCSR_HYPRE));
23825fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetPreallocationCOO_C",MatSetPreallocationCOO_HYPRE));
23835fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetValuesCOO_C",MatSetValuesCOO_HYPRE));
23846ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
23856ea7df73SStefano Zampini #if defined(HYPRE_USING_HIP)
23869566063dSJacob Faibussowitsch   PetscCall(PetscDeviceInitialize(PETSC_DEVICE_HIP));
23879566063dSJacob Faibussowitsch   PetscCall(MatSetVecType(B,VECHIP));
23886ea7df73SStefano Zampini #endif
23896ea7df73SStefano Zampini #if defined(HYPRE_USING_CUDA)
23909566063dSJacob Faibussowitsch   PetscCall(PetscDeviceInitialize(PETSC_DEVICE_CUDA));
23919566063dSJacob Faibussowitsch   PetscCall(MatSetVecType(B,VECCUDA));
23926ea7df73SStefano Zampini #endif
23936ea7df73SStefano Zampini #endif
239463c07aadSStefano Zampini   PetscFunctionReturn(0);
239563c07aadSStefano Zampini }
239663c07aadSStefano Zampini 
2397225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void *ptr)
2398225daaf8SStefano Zampini {
2399225daaf8SStefano Zampini    PetscFunctionBegin;
2400e6de0934SSatish Balay    hypre_TFree(ptr,HYPRE_MEMORY_HOST);
2401225daaf8SStefano Zampini    PetscFunctionReturn(0);
2402225daaf8SStefano Zampini }
2403