xref: /petsc/src/mat/impls/hypre/mhypre.c (revision f2f41e485aa34be1ebd571fc6d0409440dab19e0)
163c07aadSStefano Zampini /*
263c07aadSStefano Zampini     Creates hypre ijmatrix from PETSc matrix
363c07aadSStefano Zampini */
4225daaf8SStefano Zampini 
5c6698e78SStefano Zampini #include <petscpkg_version.h>
639accc25SStefano Zampini #include <petsc/private/petschypre.h>
7dd9c0a25Sstefano_zampini #include <petscmathypre.h>
863c07aadSStefano Zampini #include <petsc/private/matimpl.h>
9a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h>
1063c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h>
1163c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h>
1258968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h>
1358968eb6SStefano Zampini #include <HYPRE.h>
14c1a070e6SStefano Zampini #include <HYPRE_utilities.h>
15cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h>
1668ec7858SStefano Zampini #include <_hypre_sstruct_ls.h>
1763c07aadSStefano Zampini 
180e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
190e6427aaSSatish Balay   #define hypre_ParCSRMatrixClone(A, B) hypre_ParCSRMatrixCompleteClone(A)
200e6427aaSSatish Balay #endif
210e6427aaSSatish Balay 
22bb16242fSVictor A. P. Magri #if PETSC_PKG_HYPRE_VERSION_GE(2, 15, 0)
23bb16242fSVictor A. P. Magri   #define HYPRE_AssumedPartitionCheck() 1
24bb16242fSVictor A. P. Magri #endif
25bb16242fSVictor A. P. Magri 
2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat, Mat_HYPRE *);
2763c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat, Mat, HYPRE_IJMatrix);
28b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_MPIAIJ(Mat, HYPRE_IJMatrix);
29b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_SeqAIJ(Mat, HYPRE_IJMatrix);
3039accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat, HYPRE_Complex, Vec, HYPRE_Complex, Vec, PetscBool);
316ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[], const PetscScalar[], InsertMode ins);
3263c07aadSStefano Zampini 
33d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij)
34d71ae5a4SJacob Faibussowitsch {
3563c07aadSStefano Zampini   PetscInt        i, n_d, n_o;
3663c07aadSStefano Zampini   const PetscInt *ia_d, *ia_o;
3763c07aadSStefano Zampini   PetscBool       done_d = PETSC_FALSE, done_o = PETSC_FALSE;
382cf14000SStefano Zampini   HYPRE_Int      *nnz_d = NULL, *nnz_o = NULL;
3963c07aadSStefano Zampini 
4063c07aadSStefano Zampini   PetscFunctionBegin;
4163c07aadSStefano Zampini   if (A_d) { /* determine number of nonzero entries in local diagonal part */
429566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, &n_d, &ia_d, NULL, &done_d));
4363c07aadSStefano Zampini     if (done_d) {
449566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(n_d, &nnz_d));
45*f2f41e48SZach Atkins       for (i = 0; i < n_d; i++) nnz_d[i] = (HYPRE_Int)(ia_d[i + 1] - ia_d[i]);
4663c07aadSStefano Zampini     }
479566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, NULL, &ia_d, NULL, &done_d));
4863c07aadSStefano Zampini   }
4963c07aadSStefano Zampini   if (A_o) { /* determine number of nonzero entries in local off-diagonal part */
509566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o));
5163c07aadSStefano Zampini     if (done_o) {
529566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(n_o, &nnz_o));
53*f2f41e48SZach Atkins       for (i = 0; i < n_o; i++) nnz_o[i] = (HYPRE_Int)(ia_o[i + 1] - ia_o[i]);
5463c07aadSStefano Zampini     }
559566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o));
5663c07aadSStefano Zampini   }
5763c07aadSStefano Zampini   if (done_d) {    /* set number of nonzeros in HYPRE IJ matrix */
5863c07aadSStefano Zampini     if (!done_o) { /* only diagonal part */
599566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(n_d, &nnz_o));
6063c07aadSStefano Zampini     }
61c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
62c6698e78SStefano Zampini     { /* If we don't do this, the columns of the matrix will be all zeros! */
63c6698e78SStefano Zampini       hypre_AuxParCSRMatrix *aux_matrix;
64c6698e78SStefano Zampini       aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
65c6698e78SStefano Zampini       hypre_AuxParCSRMatrixDestroy(aux_matrix);
66c6698e78SStefano Zampini       hypre_IJMatrixTranslator(ij) = NULL;
67a333fa2bSZach Atkins       PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(ij, nnz_d, nnz_o));
6822235d61SPierre Jolivet       /* it seems they partially fixed it in 2.19.0 */
6922235d61SPierre Jolivet   #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
70c6698e78SStefano Zampini       aux_matrix                               = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
71c6698e78SStefano Zampini       hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1;
7222235d61SPierre Jolivet   #endif
73c6698e78SStefano Zampini     }
74c6698e78SStefano Zampini #else
75a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(ij, nnz_d, nnz_o));
76c6698e78SStefano Zampini #endif
779566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz_d));
789566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz_o));
7963c07aadSStefano Zampini   }
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
8163c07aadSStefano Zampini }
8263c07aadSStefano Zampini 
83d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA)
84d71ae5a4SJacob Faibussowitsch {
85*f2f41e48SZach Atkins   HYPRE_Int rstart, rend, cstart, cend;
8663c07aadSStefano Zampini 
8763c07aadSStefano Zampini   PetscFunctionBegin;
889566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
899566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
90*f2f41e48SZach Atkins   rstart = (HYPRE_Int)A->rmap->rstart;
91*f2f41e48SZach Atkins   rend   = (HYPRE_Int)A->rmap->rend;
92*f2f41e48SZach Atkins   cstart = (HYPRE_Int)A->cmap->rstart;
93*f2f41e48SZach Atkins   cend   = (HYPRE_Int)A->cmap->rend;
94ea9ee2c1SPierre Jolivet   PetscHYPREInitialize();
95651b1cf9SStefano Zampini   if (hA->ij) {
96651b1cf9SStefano Zampini     if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL;
97a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixDestroy(hA->ij));
98651b1cf9SStefano Zampini   }
99a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij));
100a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR));
10163c07aadSStefano Zampini   {
10263c07aadSStefano Zampini     PetscBool       same;
10363c07aadSStefano Zampini     Mat             A_d, A_o;
10463c07aadSStefano Zampini     const PetscInt *colmap;
1059566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &same));
10663c07aadSStefano Zampini     if (same) {
1079566063dSJacob Faibussowitsch       PetscCall(MatMPIAIJGetSeqAIJ(A, &A_d, &A_o, &colmap));
1089566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij));
1093ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
11063c07aadSStefano Zampini     }
1119566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIBAIJ, &same));
11263c07aadSStefano Zampini     if (same) {
1139566063dSJacob Faibussowitsch       PetscCall(MatMPIBAIJGetSeqBAIJ(A, &A_d, &A_o, &colmap));
1149566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij));
1153ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
11663c07aadSStefano Zampini     }
1179566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &same));
11863c07aadSStefano Zampini     if (same) {
1199566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij));
1203ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
12163c07aadSStefano Zampini     }
1229566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQBAIJ, &same));
12363c07aadSStefano Zampini     if (same) {
1249566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij));
1253ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
12663c07aadSStefano Zampini     }
12763c07aadSStefano Zampini   }
1283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
12963c07aadSStefano Zampini }
13063c07aadSStefano Zampini 
131b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ(Mat A, HYPRE_IJMatrix ij)
132d71ae5a4SJacob Faibussowitsch {
13363c07aadSStefano Zampini   PetscBool flg;
13463c07aadSStefano Zampini 
13563c07aadSStefano Zampini   PetscFunctionBegin;
1366ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
137a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixInitialize(ij));
1386ea7df73SStefano Zampini #else
139a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixInitialize_v2(ij, HYPRE_MEMORY_HOST));
1406ea7df73SStefano Zampini #endif
1419566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &flg));
142b73e3080SStefano Zampini   if (flg) {
143b73e3080SStefano Zampini     PetscCall(MatHYPRE_IJMatrixCopyIJ_MPIAIJ(A, ij));
1443ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
14563c07aadSStefano Zampini   }
1469566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &flg));
14763c07aadSStefano Zampini   if (flg) {
148b73e3080SStefano Zampini     PetscCall(MatHYPRE_IJMatrixCopyIJ_SeqAIJ(A, ij));
1493ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
15063c07aadSStefano Zampini   }
151b73e3080SStefano Zampini   PetscCheck(PETSC_FALSE, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "No support for matrix type %s", ((PetscObject)A)->type_name);
15287ef5fa6SStefano Zampini   PetscFunctionReturn(PETSC_SUCCESS);
15363c07aadSStefano Zampini }
15463c07aadSStefano Zampini 
155b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_SeqAIJ(Mat A, HYPRE_IJMatrix ij)
156d71ae5a4SJacob Faibussowitsch {
15763c07aadSStefano Zampini   Mat_SeqAIJ            *pdiag = (Mat_SeqAIJ *)A->data;
15858968eb6SStefano Zampini   HYPRE_Int              type;
15963c07aadSStefano Zampini   hypre_ParCSRMatrix    *par_matrix;
16063c07aadSStefano Zampini   hypre_AuxParCSRMatrix *aux_matrix;
16163c07aadSStefano Zampini   hypre_CSRMatrix       *hdiag;
1622cf14000SStefano Zampini   PetscBool              sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
16363c07aadSStefano Zampini 
16463c07aadSStefano Zampini   PetscFunctionBegin;
165a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(ij, &type));
16608401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
167a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(ij, (void **)&par_matrix));
16863c07aadSStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(par_matrix);
16963c07aadSStefano Zampini   /*
17063c07aadSStefano Zampini        this is the Hack part where we monkey directly with the hypre datastructures
17163c07aadSStefano Zampini   */
1722cf14000SStefano Zampini   if (sameint) {
1739566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->i, pdiag->i, A->rmap->n + 1));
1749566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->j, pdiag->j, pdiag->nz));
1752cf14000SStefano Zampini   } else {
1762cf14000SStefano Zampini     PetscInt i;
1772cf14000SStefano Zampini 
1782cf14000SStefano Zampini     for (i = 0; i < A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i];
1792cf14000SStefano Zampini     for (i = 0; i < pdiag->nz; i++) hdiag->j[i] = (HYPRE_Int)pdiag->j[i];
1802cf14000SStefano Zampini   }
1816ea7df73SStefano Zampini 
182ea9daf28SStefano Zampini   aux_matrix                               = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
18363c07aadSStefano Zampini   hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0;
1843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18563c07aadSStefano Zampini }
18663c07aadSStefano Zampini 
187b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_MPIAIJ(Mat A, HYPRE_IJMatrix ij)
188d71ae5a4SJacob Faibussowitsch {
18963c07aadSStefano Zampini   Mat_MPIAIJ            *pA = (Mat_MPIAIJ *)A->data;
19063c07aadSStefano Zampini   Mat_SeqAIJ            *pdiag, *poffd;
19163c07aadSStefano Zampini   PetscInt               i, *garray = pA->garray, *jj, cstart, *pjj;
1922cf14000SStefano Zampini   HYPRE_Int             *hjj, type;
19363c07aadSStefano Zampini   hypre_ParCSRMatrix    *par_matrix;
19463c07aadSStefano Zampini   hypre_AuxParCSRMatrix *aux_matrix;
19563c07aadSStefano Zampini   hypre_CSRMatrix       *hdiag, *hoffd;
1962cf14000SStefano Zampini   PetscBool              sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
19763c07aadSStefano Zampini 
19863c07aadSStefano Zampini   PetscFunctionBegin;
19963c07aadSStefano Zampini   pdiag = (Mat_SeqAIJ *)pA->A->data;
20063c07aadSStefano Zampini   poffd = (Mat_SeqAIJ *)pA->B->data;
201da81f932SPierre Jolivet   /* cstart is only valid for square MPIAIJ laid out in the usual way */
2029566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A, &cstart, NULL));
20363c07aadSStefano Zampini 
204a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(ij, &type));
20508401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
206a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(ij, (void **)&par_matrix));
20763c07aadSStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(par_matrix);
20863c07aadSStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(par_matrix);
20963c07aadSStefano Zampini 
2102cf14000SStefano Zampini   if (sameint) {
2119566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->i, pdiag->i, pA->A->rmap->n + 1));
2122cf14000SStefano Zampini   } else {
213f4f49eeaSPierre Jolivet     for (i = 0; i < pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i];
2142cf14000SStefano Zampini   }
215b73e3080SStefano Zampini 
2162cf14000SStefano Zampini   hjj = hdiag->j;
2172cf14000SStefano Zampini   pjj = pdiag->j;
218c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
219*f2f41e48SZach Atkins   for (i = 0; i < pdiag->nz; i++) hjj[i] = (HYPRE_Int)pjj[i];
220c6698e78SStefano Zampini #else
2212cf14000SStefano Zampini   for (i = 0; i < pdiag->nz; i++) hjj[i] = cstart + pjj[i];
222c6698e78SStefano Zampini #endif
2232cf14000SStefano Zampini   if (sameint) {
2249566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hoffd->i, poffd->i, pA->A->rmap->n + 1));
2252cf14000SStefano Zampini   } else {
226f4f49eeaSPierre Jolivet     for (i = 0; i < pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)poffd->i[i];
2272cf14000SStefano Zampini   }
2282cf14000SStefano Zampini 
22906977982Sstefanozampini   jj = (PetscInt *)hoffd->j;
230c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
231a333fa2bSZach Atkins   PetscCallHYPRE(hypre_CSRMatrixBigInitialize(hoffd));
232c6698e78SStefano Zampini   jj = (PetscInt *)hoffd->big_j;
233c6698e78SStefano Zampini #endif
2342cf14000SStefano Zampini   pjj = poffd->j;
23563c07aadSStefano Zampini   for (i = 0; i < poffd->nz; i++) jj[i] = garray[pjj[i]];
236c6698e78SStefano Zampini 
237ea9daf28SStefano Zampini   aux_matrix                               = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
23863c07aadSStefano Zampini   hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0;
2393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24063c07aadSStefano Zampini }
24163c07aadSStefano Zampini 
242d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat *B)
243d71ae5a4SJacob Faibussowitsch {
244f4f49eeaSPierre Jolivet   Mat_HYPRE             *mhA = (Mat_HYPRE *)A->data;
2452df22349SStefano Zampini   Mat                    lA;
2462df22349SStefano Zampini   ISLocalToGlobalMapping rl2g, cl2g;
2472df22349SStefano Zampini   IS                     is;
2482df22349SStefano Zampini   hypre_ParCSRMatrix    *hA;
2492df22349SStefano Zampini   hypre_CSRMatrix       *hdiag, *hoffd;
2502df22349SStefano Zampini   MPI_Comm               comm;
25139accc25SStefano Zampini   HYPRE_Complex         *hdd, *hod, *aa;
25239accc25SStefano Zampini   PetscScalar           *data;
2532cf14000SStefano Zampini   HYPRE_BigInt          *col_map_offd;
2542cf14000SStefano Zampini   HYPRE_Int             *hdi, *hdj, *hoi, *hoj;
2552df22349SStefano Zampini   PetscInt              *ii, *jj, *iptr, *jptr;
2562df22349SStefano Zampini   PetscInt               cum, dr, dc, oc, str, stc, nnz, i, jd, jo, M, N;
25758968eb6SStefano Zampini   HYPRE_Int              type;
25806977982Sstefanozampini   MatType                lmattype   = NULL;
25906977982Sstefanozampini   PetscBool              freeparcsr = PETSC_FALSE;
2602df22349SStefano Zampini 
2612df22349SStefano Zampini   PetscFunctionBegin;
262a1787963SStefano Zampini   comm = PetscObjectComm((PetscObject)A);
263a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(mhA->ij, &type));
26408401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
265a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(mhA->ij, (void **)&hA));
26606977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
26706977982Sstefanozampini   if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(mhA->ij)) {
26806977982Sstefanozampini     /* Support by copying back on the host and copy to GPU
26906977982Sstefanozampini        Kind of inefficient, but this is the best we can do now */
27006977982Sstefanozampini   #if defined(HYPRE_USING_HIP)
27106977982Sstefanozampini     lmattype = MATSEQAIJHIPSPARSE;
27206977982Sstefanozampini   #elif defined(HYPRE_USING_CUDA)
27306977982Sstefanozampini     lmattype = MATSEQAIJCUSPARSE;
27406977982Sstefanozampini   #endif
27506977982Sstefanozampini     hA         = hypre_ParCSRMatrixClone_v2(hA, 1, HYPRE_MEMORY_HOST);
27606977982Sstefanozampini     freeparcsr = PETSC_TRUE;
27706977982Sstefanozampini   }
27806977982Sstefanozampini #endif
2792df22349SStefano Zampini   M     = hypre_ParCSRMatrixGlobalNumRows(hA);
2802df22349SStefano Zampini   N     = hypre_ParCSRMatrixGlobalNumCols(hA);
2812df22349SStefano Zampini   str   = hypre_ParCSRMatrixFirstRowIndex(hA);
2822df22349SStefano Zampini   stc   = hypre_ParCSRMatrixFirstColDiag(hA);
2832df22349SStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(hA);
2842df22349SStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(hA);
2852df22349SStefano Zampini   dr    = hypre_CSRMatrixNumRows(hdiag);
2862df22349SStefano Zampini   dc    = hypre_CSRMatrixNumCols(hdiag);
2872df22349SStefano Zampini   nnz   = hypre_CSRMatrixNumNonzeros(hdiag);
2882df22349SStefano Zampini   hdi   = hypre_CSRMatrixI(hdiag);
2892df22349SStefano Zampini   hdj   = hypre_CSRMatrixJ(hdiag);
2902df22349SStefano Zampini   hdd   = hypre_CSRMatrixData(hdiag);
2912df22349SStefano Zampini   oc    = hypre_CSRMatrixNumCols(hoffd);
2922df22349SStefano Zampini   nnz += hypre_CSRMatrixNumNonzeros(hoffd);
2932df22349SStefano Zampini   hoi = hypre_CSRMatrixI(hoffd);
2942df22349SStefano Zampini   hoj = hypre_CSRMatrixJ(hoffd);
2952df22349SStefano Zampini   hod = hypre_CSRMatrixData(hoffd);
2962df22349SStefano Zampini   if (reuse != MAT_REUSE_MATRIX) {
2972df22349SStefano Zampini     PetscInt *aux;
2982df22349SStefano Zampini 
2992df22349SStefano Zampini     /* generate l2g maps for rows and cols */
3009566063dSJacob Faibussowitsch     PetscCall(ISCreateStride(comm, dr, str, 1, &is));
3019566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingCreateIS(is, &rl2g));
3029566063dSJacob Faibussowitsch     PetscCall(ISDestroy(&is));
3032df22349SStefano Zampini     col_map_offd = hypre_ParCSRMatrixColMapOffd(hA);
3049566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dc + oc, &aux));
3052df22349SStefano Zampini     for (i = 0; i < dc; i++) aux[i] = i + stc;
3062df22349SStefano Zampini     for (i = 0; i < oc; i++) aux[i + dc] = col_map_offd[i];
3079566063dSJacob Faibussowitsch     PetscCall(ISCreateGeneral(comm, dc + oc, aux, PETSC_OWN_POINTER, &is));
3089566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingCreateIS(is, &cl2g));
3099566063dSJacob Faibussowitsch     PetscCall(ISDestroy(&is));
3102df22349SStefano Zampini     /* create MATIS object */
3119566063dSJacob Faibussowitsch     PetscCall(MatCreate(comm, B));
3129566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(*B, dr, dc, M, N));
3139566063dSJacob Faibussowitsch     PetscCall(MatSetType(*B, MATIS));
3149566063dSJacob Faibussowitsch     PetscCall(MatSetLocalToGlobalMapping(*B, rl2g, cl2g));
3159566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingDestroy(&rl2g));
3169566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingDestroy(&cl2g));
3172df22349SStefano Zampini 
3182df22349SStefano Zampini     /* allocate CSR for local matrix */
3199566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dr + 1, &iptr));
3209566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz, &jptr));
3219566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz, &data));
3222df22349SStefano Zampini   } else {
3232df22349SStefano Zampini     PetscInt  nr;
3242df22349SStefano Zampini     PetscBool done;
3259566063dSJacob Faibussowitsch     PetscCall(MatISGetLocalMat(*B, &lA));
3269566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(lA, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&iptr, (const PetscInt **)&jptr, &done));
32708401ef6SPierre Jolivet     PetscCheck(nr == dr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT, nr, dr);
32808401ef6SPierre Jolivet     PetscCheck(iptr[nr] >= nnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in local mat! reuse %" PetscInt_FMT " requested %" PetscInt_FMT, iptr[nr], nnz);
32906977982Sstefanozampini     PetscCall(MatSeqAIJGetArrayWrite(lA, &data));
3302df22349SStefano Zampini   }
3312df22349SStefano Zampini   /* merge local matrices */
3322df22349SStefano Zampini   ii  = iptr;
3332df22349SStefano Zampini   jj  = jptr;
33439accc25SStefano Zampini   aa  = (HYPRE_Complex *)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */
3352df22349SStefano Zampini   *ii = *(hdi++) + *(hoi++);
3362df22349SStefano Zampini   for (jd = 0, jo = 0, cum = 0; *ii < nnz; cum++) {
33739accc25SStefano Zampini     PetscScalar *aold = (PetscScalar *)aa;
3382df22349SStefano Zampini     PetscInt    *jold = jj, nc = jd + jo;
3399371c9d4SSatish Balay     for (; jd < *hdi; jd++) {
3409371c9d4SSatish Balay       *jj++ = *hdj++;
3419371c9d4SSatish Balay       *aa++ = *hdd++;
3429371c9d4SSatish Balay     }
3439371c9d4SSatish Balay     for (; jo < *hoi; jo++) {
3449371c9d4SSatish Balay       *jj++ = *hoj++ + dc;
3459371c9d4SSatish Balay       *aa++ = *hod++;
3469371c9d4SSatish Balay     }
3472df22349SStefano Zampini     *(++ii) = *(hdi++) + *(hoi++);
3489566063dSJacob Faibussowitsch     PetscCall(PetscSortIntWithScalarArray(jd + jo - nc, jold, aold));
3492df22349SStefano Zampini   }
3502df22349SStefano Zampini   for (; cum < dr; cum++) *(++ii) = nnz;
3512df22349SStefano Zampini   if (reuse != MAT_REUSE_MATRIX) {
352a033916dSStefano Zampini     Mat_SeqAIJ *a;
353a033916dSStefano Zampini 
3549566063dSJacob Faibussowitsch     PetscCall(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF, dr, dc + oc, iptr, jptr, data, &lA));
355a033916dSStefano Zampini     /* hack SeqAIJ */
356f4f49eeaSPierre Jolivet     a          = (Mat_SeqAIJ *)lA->data;
357a033916dSStefano Zampini     a->free_a  = PETSC_TRUE;
358a033916dSStefano Zampini     a->free_ij = PETSC_TRUE;
35906977982Sstefanozampini     if (lmattype) PetscCall(MatConvert(lA, lmattype, MAT_INPLACE_MATRIX, &lA));
36006977982Sstefanozampini     PetscCall(MatISSetLocalMat(*B, lA));
3619566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&lA));
36206977982Sstefanozampini   } else {
36306977982Sstefanozampini     PetscCall(MatSeqAIJRestoreArrayWrite(lA, &data));
3642df22349SStefano Zampini   }
3659566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
3669566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
36748a46eb9SPierre Jolivet   if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, B));
368a333fa2bSZach Atkins   if (freeparcsr) PetscCallHYPRE(hypre_ParCSRMatrixDestroy(hA));
3693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3702df22349SStefano Zampini }
3712df22349SStefano Zampini 
37206977982Sstefanozampini static PetscErrorCode MatHYPRE_DestroyCOOMat(Mat mat)
373d71ae5a4SJacob Faibussowitsch {
37406977982Sstefanozampini   Mat_HYPRE *hA = (Mat_HYPRE *)mat->data;
37563c07aadSStefano Zampini 
37663c07aadSStefano Zampini   PetscFunctionBegin;
37706977982Sstefanozampini   if (hA->cooMat) { /* If cooMat is present we need to destroy the column indices */
37806977982Sstefanozampini     PetscCall(MatDestroy(&hA->cooMat));
37906977982Sstefanozampini     if (hA->cooMatAttached) {
38006977982Sstefanozampini       hypre_CSRMatrix     *csr;
38106977982Sstefanozampini       hypre_ParCSRMatrix  *parcsr;
38206977982Sstefanozampini       HYPRE_MemoryLocation mem;
38306977982Sstefanozampini 
384a333fa2bSZach Atkins       PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr));
38506977982Sstefanozampini       csr = hypre_ParCSRMatrixDiag(parcsr);
38606977982Sstefanozampini       if (csr) {
38706977982Sstefanozampini         mem = hypre_CSRMatrixMemoryLocation(csr);
38806977982Sstefanozampini         PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixJ(csr), mem));
38906977982Sstefanozampini         PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixBigJ(csr), mem));
390b73e3080SStefano Zampini       }
39106977982Sstefanozampini       csr = hypre_ParCSRMatrixOffd(parcsr);
39206977982Sstefanozampini       if (csr) {
39306977982Sstefanozampini         mem = hypre_CSRMatrixMemoryLocation(csr);
39406977982Sstefanozampini         PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixJ(csr), mem));
39506977982Sstefanozampini         PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixBigJ(csr), mem));
396b73e3080SStefano Zampini       }
397b73e3080SStefano Zampini     }
39806977982Sstefanozampini   }
39906977982Sstefanozampini   hA->cooMatAttached = PETSC_FALSE;
400b73e3080SStefano Zampini   PetscFunctionReturn(PETSC_SUCCESS);
401b73e3080SStefano Zampini }
402b73e3080SStefano Zampini 
40306977982Sstefanozampini static PetscErrorCode MatHYPRE_CreateCOOMat(Mat mat)
404b73e3080SStefano Zampini {
40506977982Sstefanozampini   MPI_Comm    comm;
40606977982Sstefanozampini   PetscMPIInt size;
40706977982Sstefanozampini   PetscLayout rmap, cmap;
40806977982Sstefanozampini   Mat_HYPRE  *hmat    = (Mat_HYPRE *)mat->data;
40906977982Sstefanozampini   MatType     matType = MATAIJ; /* default type of cooMat */
410b73e3080SStefano Zampini 
411b73e3080SStefano Zampini   PetscFunctionBegin;
41206977982Sstefanozampini   /* Build an agent matrix cooMat with AIJ format
41306977982Sstefanozampini      It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work.
41406977982Sstefanozampini    */
41506977982Sstefanozampini   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
41606977982Sstefanozampini   PetscCallMPI(MPI_Comm_size(comm, &size));
41706977982Sstefanozampini   PetscCall(PetscLayoutSetUp(mat->rmap));
41806977982Sstefanozampini   PetscCall(PetscLayoutSetUp(mat->cmap));
41906977982Sstefanozampini   PetscCall(MatGetLayouts(mat, &rmap, &cmap));
420b73e3080SStefano Zampini 
42106977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
42206977982Sstefanozampini   if (!mat->boundtocpu) { /* mat will be on device, so will cooMat */
42306977982Sstefanozampini   #if defined(HYPRE_USING_HIP)
42406977982Sstefanozampini     matType = MATAIJHIPSPARSE;
42506977982Sstefanozampini   #elif defined(HYPRE_USING_CUDA)
42606977982Sstefanozampini     matType = MATAIJCUSPARSE;
427e64794e4SJunchao Zhang   #elif defined(HYPRE_USING_SYCL) && defined(PETSC_HAVE_KOKKOS_KERNELS)
428e64794e4SJunchao Zhang     matType = MATAIJKOKKOS;
42906977982Sstefanozampini   #else
430e64794e4SJunchao Zhang     SETERRQ(comm, PETSC_ERR_SUP, "No HYPRE device available. Suggest re-installing with Kokkos Kernels");
43106977982Sstefanozampini   #endif
432b73e3080SStefano Zampini   }
43306977982Sstefanozampini #endif
43406977982Sstefanozampini 
43506977982Sstefanozampini   /* Do COO preallocation through cooMat */
43606977982Sstefanozampini   PetscCall(MatHYPRE_DestroyCOOMat(mat));
43706977982Sstefanozampini   PetscCall(MatCreate(comm, &hmat->cooMat));
43806977982Sstefanozampini   PetscCall(MatSetType(hmat->cooMat, matType));
43906977982Sstefanozampini   PetscCall(MatSetLayouts(hmat->cooMat, rmap, cmap));
44006977982Sstefanozampini 
44106977982Sstefanozampini   /* allocate local matrices if needed */
44206977982Sstefanozampini   PetscCall(MatMPIAIJSetPreallocation(hmat->cooMat, 0, NULL, 0, NULL));
44306977982Sstefanozampini   PetscFunctionReturn(PETSC_SUCCESS);
44406977982Sstefanozampini }
44506977982Sstefanozampini 
44606977982Sstefanozampini /* Attach cooMat data array to hypre matrix.
44706977982Sstefanozampini    When AIJCUPMSPARSE will support raw device pointers and not THRUSTARRAY
44806977982Sstefanozampini    we should swap the arrays: i.e., attach hypre matrix array to cooMat
44906977982Sstefanozampini    This is because hypre should be in charge of handling the memory,
45006977982Sstefanozampini    cooMat is only a way to reuse PETSc COO code.
45106977982Sstefanozampini    attaching the memory will then be done at MatSetValuesCOO time and it will dynamically
45206977982Sstefanozampini    support hypre matrix migrating to host.
45306977982Sstefanozampini */
45406977982Sstefanozampini static PetscErrorCode MatHYPRE_AttachCOOMat(Mat mat)
45506977982Sstefanozampini {
45606977982Sstefanozampini   Mat_HYPRE           *hmat = (Mat_HYPRE *)mat->data;
45706977982Sstefanozampini   hypre_CSRMatrix     *diag, *offd;
45806977982Sstefanozampini   hypre_ParCSRMatrix  *parCSR;
45906977982Sstefanozampini   HYPRE_MemoryLocation hmem = HYPRE_MEMORY_HOST;
46006977982Sstefanozampini   PetscMemType         pmem;
46106977982Sstefanozampini   Mat                  A, B;
46206977982Sstefanozampini   PetscScalar         *a;
46306977982Sstefanozampini   PetscMPIInt          size;
46406977982Sstefanozampini   MPI_Comm             comm;
46506977982Sstefanozampini 
46606977982Sstefanozampini   PetscFunctionBegin;
46706977982Sstefanozampini   PetscCheck(hmat->cooMat, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet");
46806977982Sstefanozampini   if (hmat->cooMatAttached) PetscFunctionReturn(PETSC_SUCCESS);
46906977982Sstefanozampini   PetscCheck(hmat->cooMat->preallocated, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix is not preallocated");
47006977982Sstefanozampini   PetscCall(PetscObjectSetName((PetscObject)hmat->cooMat, "_internal_COO_mat_for_hypre"));
47106977982Sstefanozampini   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
47206977982Sstefanozampini   PetscCallMPI(MPI_Comm_size(comm, &size));
47306977982Sstefanozampini 
47406977982Sstefanozampini   /* Alias cooMat's data array to IJMatrix's */
475a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(hmat->ij, (void **)&parCSR));
47606977982Sstefanozampini   diag = hypre_ParCSRMatrixDiag(parCSR);
47706977982Sstefanozampini   offd = hypre_ParCSRMatrixOffd(parCSR);
47806977982Sstefanozampini 
47906977982Sstefanozampini   A = (size == 1) ? hmat->cooMat : ((Mat_MPIAIJ *)hmat->cooMat->data)->A;
48006977982Sstefanozampini   B = (size == 1) ? NULL : ((Mat_MPIAIJ *)hmat->cooMat->data)->B;
48106977982Sstefanozampini 
48206977982Sstefanozampini   PetscCall(PetscObjectSetName((PetscObject)A, "_internal_COO_mat_for_hypre"));
48306977982Sstefanozampini   hmem = hypre_CSRMatrixMemoryLocation(diag);
48406977982Sstefanozampini   PetscCall(MatSeqAIJGetCSRAndMemType(A, NULL, NULL, &a, &pmem));
48506977982Sstefanozampini   PetscAssert((PetscMemTypeHost(pmem) && hmem == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(pmem) && hmem == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch");
48606977982Sstefanozampini   PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(diag), hmem));
48706977982Sstefanozampini   hypre_CSRMatrixData(diag)     = (HYPRE_Complex *)a;
48806977982Sstefanozampini   hypre_CSRMatrixOwnsData(diag) = 0; /* Take ownership of (j,a) away from hypre. As a result, we need to free them on our own */
48906977982Sstefanozampini 
49006977982Sstefanozampini   if (B) {
49106977982Sstefanozampini     hmem = hypre_CSRMatrixMemoryLocation(offd);
49206977982Sstefanozampini     PetscCall(MatSeqAIJGetCSRAndMemType(B, NULL, NULL, &a, &pmem));
49306977982Sstefanozampini     PetscAssert((PetscMemTypeHost(pmem) && hmem == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(pmem) && hmem == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch");
49406977982Sstefanozampini     PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(offd), hmem));
49506977982Sstefanozampini     hypre_CSRMatrixData(offd)     = (HYPRE_Complex *)a;
49606977982Sstefanozampini     hypre_CSRMatrixOwnsData(offd) = 0;
49706977982Sstefanozampini   }
49806977982Sstefanozampini   hmat->cooMatAttached = PETSC_TRUE;
49906977982Sstefanozampini   PetscFunctionReturn(PETSC_SUCCESS);
50006977982Sstefanozampini }
50106977982Sstefanozampini 
5021c265611SJunchao Zhang // Build COO's coordinate list i[], j[] based on CSR's i[], j[] arrays and the number of local rows 'n'
50306977982Sstefanozampini static PetscErrorCode CSRtoCOO_Private(PetscInt n, const PetscInt ii[], const PetscInt jj[], PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j)
50406977982Sstefanozampini {
50506977982Sstefanozampini   PetscInt *cooi, *cooj;
50606977982Sstefanozampini 
50706977982Sstefanozampini   PetscFunctionBegin;
50806977982Sstefanozampini   *ncoo = ii[n];
50906977982Sstefanozampini   PetscCall(PetscMalloc2(*ncoo, &cooi, *ncoo, &cooj));
51006977982Sstefanozampini   for (PetscInt i = 0; i < n; i++) {
51106977982Sstefanozampini     for (PetscInt j = ii[i]; j < ii[i + 1]; j++) cooi[j] = i;
51206977982Sstefanozampini   }
51306977982Sstefanozampini   PetscCall(PetscArraycpy(cooj, jj, *ncoo));
51406977982Sstefanozampini   *coo_i = cooi;
51506977982Sstefanozampini   *coo_j = cooj;
51606977982Sstefanozampini   PetscFunctionReturn(PETSC_SUCCESS);
51706977982Sstefanozampini }
51806977982Sstefanozampini 
5191c265611SJunchao Zhang // Similar to CSRtoCOO_Private, but the CSR's i[], j[] are of type HYPRE_Int
52006977982Sstefanozampini static PetscErrorCode CSRtoCOO_HYPRE_Int_Private(PetscInt n, const HYPRE_Int ii[], const HYPRE_Int jj[], PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j)
52106977982Sstefanozampini {
52206977982Sstefanozampini   PetscInt *cooi, *cooj;
52306977982Sstefanozampini 
52406977982Sstefanozampini   PetscFunctionBegin;
52506977982Sstefanozampini   *ncoo = ii[n];
52606977982Sstefanozampini   PetscCall(PetscMalloc2(*ncoo, &cooi, *ncoo, &cooj));
52706977982Sstefanozampini   for (PetscInt i = 0; i < n; i++) {
52806977982Sstefanozampini     for (HYPRE_Int j = ii[i]; j < ii[i + 1]; j++) cooi[j] = i;
52906977982Sstefanozampini   }
53006977982Sstefanozampini   for (PetscCount i = 0; i < *ncoo; i++) cooj[i] = jj[i];
53106977982Sstefanozampini   *coo_i = cooi;
53206977982Sstefanozampini   *coo_j = cooj;
53306977982Sstefanozampini   PetscFunctionReturn(PETSC_SUCCESS);
53406977982Sstefanozampini }
53506977982Sstefanozampini 
5361c265611SJunchao Zhang // Build a COO data structure for the seqaij matrix, as if the nonzeros are laid out in the same order as in the CSR
53706977982Sstefanozampini static PetscErrorCode MatSeqAIJGetCOO_Private(Mat A, PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j)
53806977982Sstefanozampini {
53906977982Sstefanozampini   PetscInt        n;
54006977982Sstefanozampini   const PetscInt *ii, *jj;
54106977982Sstefanozampini   PetscBool       done;
54206977982Sstefanozampini 
54306977982Sstefanozampini   PetscFunctionBegin;
54406977982Sstefanozampini   PetscCall(MatGetRowIJ(A, 0, PETSC_FALSE, PETSC_FALSE, &n, &ii, &jj, &done));
54506977982Sstefanozampini   PetscCheck(done, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Failure for MatGetRowIJ");
54606977982Sstefanozampini   PetscCall(CSRtoCOO_Private(n, ii, jj, ncoo, coo_i, coo_j));
54706977982Sstefanozampini   PetscCall(MatRestoreRowIJ(A, 0, PETSC_FALSE, PETSC_FALSE, &n, &ii, &jj, &done));
54806977982Sstefanozampini   PetscCheck(done, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Failure for MatRestoreRowIJ");
54906977982Sstefanozampini   PetscFunctionReturn(PETSC_SUCCESS);
55006977982Sstefanozampini }
55106977982Sstefanozampini 
5521c265611SJunchao Zhang // Build a COO data structure for the hypreCSRMatrix, as if the nonzeros are laid out in the same order as in the hypreCSRMatrix
55306977982Sstefanozampini static PetscErrorCode hypreCSRMatrixGetCOO_Private(hypre_CSRMatrix *A, PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j)
55406977982Sstefanozampini {
55506977982Sstefanozampini   PetscInt             n = hypre_CSRMatrixNumRows(A);
55606977982Sstefanozampini   HYPRE_Int           *ii, *jj;
55706977982Sstefanozampini   HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST;
55806977982Sstefanozampini 
55906977982Sstefanozampini   PetscFunctionBegin;
56006977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
56106977982Sstefanozampini   mem = hypre_CSRMatrixMemoryLocation(A);
56206977982Sstefanozampini   if (mem != HYPRE_MEMORY_HOST) {
56306977982Sstefanozampini     PetscCount nnz = hypre_CSRMatrixNumNonzeros(A);
56406977982Sstefanozampini     PetscCall(PetscMalloc2(n + 1, &ii, nnz, &jj));
56506977982Sstefanozampini     hypre_TMemcpy(ii, hypre_CSRMatrixI(A), HYPRE_Int, n + 1, HYPRE_MEMORY_HOST, mem);
56606977982Sstefanozampini     hypre_TMemcpy(jj, hypre_CSRMatrixJ(A), HYPRE_Int, nnz, HYPRE_MEMORY_HOST, mem);
56706977982Sstefanozampini   } else {
56806977982Sstefanozampini #else
56906977982Sstefanozampini   {
57006977982Sstefanozampini #endif
57106977982Sstefanozampini     ii = hypre_CSRMatrixI(A);
57206977982Sstefanozampini     jj = hypre_CSRMatrixJ(A);
57306977982Sstefanozampini   }
57406977982Sstefanozampini   PetscCall(CSRtoCOO_HYPRE_Int_Private(n, ii, jj, ncoo, coo_i, coo_j));
57506977982Sstefanozampini   if (mem != HYPRE_MEMORY_HOST) PetscCall(PetscFree2(ii, jj));
57606977982Sstefanozampini   PetscFunctionReturn(PETSC_SUCCESS);
57706977982Sstefanozampini }
57806977982Sstefanozampini 
57906977982Sstefanozampini static PetscErrorCode MatSetValuesCOOFromCSRMatrix_Private(Mat A, hypre_CSRMatrix *H)
58006977982Sstefanozampini {
58106977982Sstefanozampini   PetscBool            iscpu = PETSC_TRUE;
58206977982Sstefanozampini   PetscScalar         *a;
58306977982Sstefanozampini   HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST;
58406977982Sstefanozampini 
58506977982Sstefanozampini   PetscFunctionBegin;
58606977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
58706977982Sstefanozampini   mem = hypre_CSRMatrixMemoryLocation(H);
58806977982Sstefanozampini   PetscCall(PetscObjectTypeCompare((PetscObject)A, MATSEQAIJ, &iscpu));
58906977982Sstefanozampini #endif
59006977982Sstefanozampini   if (iscpu && mem != HYPRE_MEMORY_HOST) {
59106977982Sstefanozampini     PetscCount nnz = hypre_CSRMatrixNumNonzeros(H);
59206977982Sstefanozampini     PetscCall(PetscMalloc1(nnz, &a));
59306977982Sstefanozampini     hypre_TMemcpy(a, hypre_CSRMatrixData(H), PetscScalar, nnz, HYPRE_MEMORY_HOST, mem);
59406977982Sstefanozampini   } else {
59506977982Sstefanozampini     a = (PetscScalar *)hypre_CSRMatrixData(H);
59606977982Sstefanozampini   }
59706977982Sstefanozampini   PetscCall(MatSetValuesCOO(A, a, INSERT_VALUES));
59806977982Sstefanozampini   if (iscpu && mem != HYPRE_MEMORY_HOST) PetscCall(PetscFree(a));
599b73e3080SStefano Zampini   PetscFunctionReturn(PETSC_SUCCESS);
600b73e3080SStefano Zampini }
601b73e3080SStefano Zampini 
602b73e3080SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B)
603b73e3080SStefano Zampini {
604b73e3080SStefano Zampini   MPI_Comm     comm = PetscObjectComm((PetscObject)A);
60506977982Sstefanozampini   Mat          M = NULL, dH = NULL, oH = NULL, dA = NULL, oA = NULL;
606d7185485SAlex Lindsay   PetscBool    ismpiaij, issbaij, isbaij, boundtocpu = PETSC_TRUE;
607b73e3080SStefano Zampini   Mat_HYPRE   *hA;
608d7185485SAlex Lindsay   PetscMemType memtype = PETSC_MEMTYPE_HOST;
609b73e3080SStefano Zampini 
610b73e3080SStefano Zampini   PetscFunctionBegin;
611d7185485SAlex Lindsay   if (PetscDefined(HAVE_HYPRE_DEVICE)) {
612d7185485SAlex Lindsay     PetscCall(MatGetCurrentMemType(A, &memtype));
613d7185485SAlex Lindsay     PetscHYPREInitialize();
614d7185485SAlex Lindsay     boundtocpu = PetscMemTypeHost(memtype) ? PETSC_TRUE : PETSC_FALSE;
615a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_SetMemoryLocation(boundtocpu ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE));
616d7185485SAlex Lindsay   }
617d7185485SAlex Lindsay 
618b73e3080SStefano Zampini   PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &issbaij, MATSEQSBAIJ, MATMPIBAIJ, ""));
619b73e3080SStefano Zampini   PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &isbaij, MATSEQBAIJ, MATMPIBAIJ, ""));
620b73e3080SStefano Zampini   if (isbaij || issbaij) { /* handle BAIJ and SBAIJ */
621b73e3080SStefano Zampini     PetscBool ismpi;
622b73e3080SStefano Zampini     MatType   newtype;
623b73e3080SStefano Zampini 
624b73e3080SStefano Zampini     PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &ismpi, MATMPISBAIJ, MATMPIBAIJ, ""));
625b73e3080SStefano Zampini     newtype = ismpi ? MATMPIAIJ : MATSEQAIJ;
62663c07aadSStefano Zampini     if (reuse == MAT_REUSE_MATRIX) {
627b73e3080SStefano Zampini       PetscCall(MatConvert(*B, newtype, MAT_INPLACE_MATRIX, B));
628b73e3080SStefano Zampini       PetscCall(MatConvert(A, newtype, MAT_REUSE_MATRIX, B));
629b73e3080SStefano Zampini       PetscCall(MatConvert(*B, MATHYPRE, MAT_INPLACE_MATRIX, B));
630b73e3080SStefano Zampini     } else if (reuse == MAT_INITIAL_MATRIX) {
631b73e3080SStefano Zampini       PetscCall(MatConvert(A, newtype, MAT_INITIAL_MATRIX, B));
632b73e3080SStefano Zampini       PetscCall(MatConvert(*B, MATHYPRE, MAT_INPLACE_MATRIX, B));
63363c07aadSStefano Zampini     } else {
634b73e3080SStefano Zampini       PetscCall(MatConvert(A, newtype, MAT_INPLACE_MATRIX, &A));
635b73e3080SStefano Zampini       PetscCall(MatConvert(A, MATHYPRE, MAT_INPLACE_MATRIX, &A));
636b73e3080SStefano Zampini     }
637d7185485SAlex Lindsay #if defined(PETSC_HAVE_DEVICE)
638d7185485SAlex Lindsay     (*B)->boundtocpu = boundtocpu;
639d7185485SAlex Lindsay #endif
640b73e3080SStefano Zampini     PetscFunctionReturn(PETSC_SUCCESS);
641b73e3080SStefano Zampini   }
64206977982Sstefanozampini 
64306977982Sstefanozampini   dA = A;
644b73e3080SStefano Zampini   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij));
645b73e3080SStefano Zampini   if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(A, &dA, &oA, NULL));
64606977982Sstefanozampini 
647b73e3080SStefano Zampini   if (reuse != MAT_REUSE_MATRIX) {
64806977982Sstefanozampini     PetscCount coo_n;
64906977982Sstefanozampini     PetscInt  *coo_i, *coo_j;
65006977982Sstefanozampini 
6519566063dSJacob Faibussowitsch     PetscCall(MatCreate(comm, &M));
6529566063dSJacob Faibussowitsch     PetscCall(MatSetType(M, MATHYPRE));
6539566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N));
654b73e3080SStefano Zampini     PetscCall(MatSetOption(M, MAT_SORTED_FULL, PETSC_TRUE));
655b73e3080SStefano Zampini     PetscCall(MatSetOption(M, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE));
656b73e3080SStefano Zampini 
657b73e3080SStefano Zampini     hA = (Mat_HYPRE *)M->data;
65806977982Sstefanozampini     PetscCall(MatHYPRE_CreateFromMat(A, hA));
65906977982Sstefanozampini     PetscCall(MatHYPRE_IJMatrixCopyIJ(A, hA->ij));
66006977982Sstefanozampini 
66106977982Sstefanozampini     PetscCall(MatHYPRE_CreateCOOMat(M));
66206977982Sstefanozampini 
66306977982Sstefanozampini     dH = hA->cooMat;
66406977982Sstefanozampini     PetscCall(PetscObjectBaseTypeCompare((PetscObject)hA->cooMat, MATMPIAIJ, &ismpiaij));
66506977982Sstefanozampini     if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(hA->cooMat, &dH, &oH, NULL));
66606977982Sstefanozampini 
66706977982Sstefanozampini     PetscCall(PetscObjectSetName((PetscObject)dH, "_internal_COO_mat_for_hypre"));
66806977982Sstefanozampini     PetscCall(MatSeqAIJGetCOO_Private(dA, &coo_n, &coo_i, &coo_j));
66906977982Sstefanozampini     PetscCall(MatSetPreallocationCOO(dH, coo_n, coo_i, coo_j));
67006977982Sstefanozampini     PetscCall(PetscFree2(coo_i, coo_j));
67106977982Sstefanozampini     if (oH) {
67206977982Sstefanozampini       PetscCall(PetscLayoutDestroy(&oH->cmap));
67306977982Sstefanozampini       PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)oH), oA->cmap->n, oA->cmap->n, 1, &oH->cmap));
67406977982Sstefanozampini       PetscCall(MatSeqAIJGetCOO_Private(oA, &coo_n, &coo_i, &coo_j));
67506977982Sstefanozampini       PetscCall(MatSetPreallocationCOO(oH, coo_n, coo_i, coo_j));
67606977982Sstefanozampini       PetscCall(PetscFree2(coo_i, coo_j));
67706977982Sstefanozampini     }
67806977982Sstefanozampini     hA->cooMat->assembled = PETSC_TRUE;
67906977982Sstefanozampini 
680b73e3080SStefano Zampini     M->preallocated = PETSC_TRUE;
68106977982Sstefanozampini     PetscCall(MatAssemblyBegin(M, MAT_FINAL_ASSEMBLY));
68206977982Sstefanozampini     PetscCall(MatAssemblyEnd(M, MAT_FINAL_ASSEMBLY));
68306977982Sstefanozampini 
68406977982Sstefanozampini     PetscCall(MatHYPRE_AttachCOOMat(M));
68584d4e069SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) *B = M;
686b73e3080SStefano Zampini   } else M = *B;
687b73e3080SStefano Zampini 
688b73e3080SStefano Zampini   hA = (Mat_HYPRE *)M->data;
68906977982Sstefanozampini   PetscCheck(hA->cooMat, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet");
69006977982Sstefanozampini 
69106977982Sstefanozampini   dH = hA->cooMat;
69206977982Sstefanozampini   PetscCall(PetscObjectBaseTypeCompare((PetscObject)hA->cooMat, MATMPIAIJ, &ismpiaij));
69306977982Sstefanozampini   if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(hA->cooMat, &dH, &oH, NULL));
69406977982Sstefanozampini 
69506977982Sstefanozampini   PetscScalar *a;
69606977982Sstefanozampini   PetscCall(MatSeqAIJGetCSRAndMemType(dA, NULL, NULL, &a, NULL));
69706977982Sstefanozampini   PetscCall(MatSetValuesCOO(dH, a, INSERT_VALUES));
69806977982Sstefanozampini   if (oH) {
69906977982Sstefanozampini     PetscCall(MatSeqAIJGetCSRAndMemType(oA, NULL, NULL, &a, NULL));
70006977982Sstefanozampini     PetscCall(MatSetValuesCOO(oH, a, INSERT_VALUES));
70106977982Sstefanozampini   }
702b73e3080SStefano Zampini 
70348a46eb9SPierre Jolivet   if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M));
704d7185485SAlex Lindsay #if defined(PETSC_HAVE_DEVICE)
705d7185485SAlex Lindsay   (*B)->boundtocpu = boundtocpu;
706d7185485SAlex Lindsay #endif
7073ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
70863c07aadSStefano Zampini }
70963c07aadSStefano Zampini 
710d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B)
711d71ae5a4SJacob Faibussowitsch {
71206977982Sstefanozampini   Mat                 M, dA = NULL, oA = NULL;
71363c07aadSStefano Zampini   hypre_ParCSRMatrix *parcsr;
71406977982Sstefanozampini   hypre_CSRMatrix    *dH, *oH;
71563c07aadSStefano Zampini   MPI_Comm            comm;
71606977982Sstefanozampini   PetscBool           ismpiaij, isseqaij;
71763c07aadSStefano Zampini 
71863c07aadSStefano Zampini   PetscFunctionBegin;
71963c07aadSStefano Zampini   comm = PetscObjectComm((PetscObject)A);
72063c07aadSStefano Zampini   if (reuse == MAT_REUSE_MATRIX) {
7219566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATMPIAIJ, &ismpiaij));
7229566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATSEQAIJ, &isseqaij));
72306977982Sstefanozampini     PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Only MATMPIAIJ or MATSEQAIJ base types are supported");
72463c07aadSStefano Zampini   }
72506977982Sstefanozampini   PetscCall(MatHYPREGetParCSR(A, &parcsr));
7266ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
72706977982Sstefanozampini   if (HYPRE_MEMORY_DEVICE == hypre_ParCSRMatrixMemoryLocation(parcsr)) {
72806977982Sstefanozampini     PetscBool isaij;
72906977982Sstefanozampini 
73006977982Sstefanozampini     PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij));
73106977982Sstefanozampini     if (isaij) {
73206977982Sstefanozampini       PetscMPIInt size;
73306977982Sstefanozampini 
7349566063dSJacob Faibussowitsch       PetscCallMPI(MPI_Comm_size(comm, &size));
73506977982Sstefanozampini   #if defined(HYPRE_USING_HIP)
73606977982Sstefanozampini       mtype = size > 1 ? MATMPIAIJHIPSPARSE : MATSEQAIJHIPSPARSE;
73706977982Sstefanozampini   #elif defined(HYPRE_USING_CUDA)
73806977982Sstefanozampini       mtype = size > 1 ? MATMPIAIJCUSPARSE : MATSEQAIJCUSPARSE;
73906977982Sstefanozampini   #else
74006977982Sstefanozampini       mtype = size > 1 ? MATMPIAIJ : MATSEQAIJ;
74106977982Sstefanozampini   #endif
74263c07aadSStefano Zampini     }
74363c07aadSStefano Zampini   }
74406977982Sstefanozampini #endif
74506977982Sstefanozampini   dH = hypre_ParCSRMatrixDiag(parcsr);
74606977982Sstefanozampini   oH = hypre_ParCSRMatrixOffd(parcsr);
7479371c9d4SSatish Balay   if (reuse != MAT_REUSE_MATRIX) {
74806977982Sstefanozampini     PetscCount coo_n;
74906977982Sstefanozampini     PetscInt  *coo_i, *coo_j;
75063c07aadSStefano Zampini 
75106977982Sstefanozampini     PetscCall(MatCreate(comm, &M));
75206977982Sstefanozampini     PetscCall(MatSetType(M, mtype));
75306977982Sstefanozampini     PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N));
75406977982Sstefanozampini     PetscCall(MatMPIAIJSetPreallocation(M, 0, NULL, 0, NULL));
75563c07aadSStefano Zampini 
75606977982Sstefanozampini     dA = M;
75706977982Sstefanozampini     PetscCall(PetscObjectBaseTypeCompare((PetscObject)M, MATMPIAIJ, &ismpiaij));
75806977982Sstefanozampini     if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(M, &dA, &oA, NULL));
759a16187a7SStefano Zampini 
76006977982Sstefanozampini     PetscCall(hypreCSRMatrixGetCOO_Private(dH, &coo_n, &coo_i, &coo_j));
76106977982Sstefanozampini     PetscCall(MatSetPreallocationCOO(dA, coo_n, coo_i, coo_j));
76206977982Sstefanozampini     PetscCall(PetscFree2(coo_i, coo_j));
76306977982Sstefanozampini     if (ismpiaij) {
76406977982Sstefanozampini       HYPRE_Int nc = hypre_CSRMatrixNumCols(oH);
765a16187a7SStefano Zampini 
76606977982Sstefanozampini       PetscCall(PetscLayoutDestroy(&oA->cmap));
76706977982Sstefanozampini       PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)oA), nc, nc, 1, &oA->cmap));
76806977982Sstefanozampini       PetscCall(hypreCSRMatrixGetCOO_Private(oH, &coo_n, &coo_i, &coo_j));
76906977982Sstefanozampini       PetscCall(MatSetPreallocationCOO(oA, coo_n, coo_i, coo_j));
77006977982Sstefanozampini       PetscCall(PetscFree2(coo_i, coo_j));
771a16187a7SStefano Zampini 
77206977982Sstefanozampini       /* garray */
773f4f49eeaSPierre Jolivet       Mat_MPIAIJ   *aij    = (Mat_MPIAIJ *)M->data;
77406977982Sstefanozampini       HYPRE_BigInt *harray = hypre_ParCSRMatrixColMapOffd(parcsr);
77506977982Sstefanozampini       PetscInt     *garray;
77606977982Sstefanozampini 
77706977982Sstefanozampini       PetscCall(PetscFree(aij->garray));
77806977982Sstefanozampini       PetscCall(PetscMalloc1(nc, &garray));
77906977982Sstefanozampini       for (HYPRE_Int i = 0; i < nc; i++) garray[i] = (PetscInt)harray[i];
78006977982Sstefanozampini       aij->garray = garray;
78106977982Sstefanozampini       PetscCall(MatSetUpMultiply_MPIAIJ(M));
782a16187a7SStefano Zampini     }
78306977982Sstefanozampini     if (reuse == MAT_INITIAL_MATRIX) *B = M;
78406977982Sstefanozampini   } else M = *B;
785225daaf8SStefano Zampini 
78606977982Sstefanozampini   dA = M;
78706977982Sstefanozampini   PetscCall(PetscObjectBaseTypeCompare((PetscObject)M, MATMPIAIJ, &ismpiaij));
78806977982Sstefanozampini   if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(M, &dA, &oA, NULL));
78906977982Sstefanozampini   PetscCall(MatSetValuesCOOFromCSRMatrix_Private(dA, dH));
79006977982Sstefanozampini   if (oA) PetscCall(MatSetValuesCOOFromCSRMatrix_Private(oA, oH));
79106977982Sstefanozampini   M->assembled = PETSC_TRUE;
79206977982Sstefanozampini   if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M));
7933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
79463c07aadSStefano Zampini }
79563c07aadSStefano Zampini 
796d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA)
797d71ae5a4SJacob Faibussowitsch {
798613e5ff0Sstefano_zampini   hypre_ParCSRMatrix *tA;
799c1a070e6SStefano Zampini   hypre_CSRMatrix    *hdiag, *hoffd;
800c1a070e6SStefano Zampini   Mat_SeqAIJ         *diag, *offd;
8012cf14000SStefano Zampini   PetscInt           *garray, i, noffd, dnnz, onnz, *row_starts, *col_starts;
802c1a070e6SStefano Zampini   MPI_Comm            comm = PetscObjectComm((PetscObject)A);
803613e5ff0Sstefano_zampini   PetscBool           ismpiaij, isseqaij;
8042cf14000SStefano Zampini   PetscBool           sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
8056ea7df73SStefano Zampini   HYPRE_Int          *hdi = NULL, *hdj = NULL, *hoi = NULL, *hoj = NULL;
8065c97c10fSStefano Zampini   PetscInt           *pdi = NULL, *pdj = NULL, *poi = NULL, *poj = NULL;
80706977982Sstefanozampini   PetscBool           iscuda, iship;
80806977982Sstefanozampini #if defined(PETSC_HAVE_DEVICE) && defined(PETSC_HAVE_HYPRE_DEVICE)
80906977982Sstefanozampini   PetscBool boundtocpu = A->boundtocpu;
81006977982Sstefanozampini #else
81106977982Sstefanozampini   PetscBool boundtocpu = PETSC_TRUE;
8126ea7df73SStefano Zampini #endif
813c1a070e6SStefano Zampini 
814c1a070e6SStefano Zampini   PetscFunctionBegin;
8159566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij));
8169566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &isseqaij));
81708401ef6SPierre Jolivet   PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Unsupported type %s", ((PetscObject)A)->type_name);
818b655ebf8SZach Atkins   PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, ""));
819b655ebf8SZach Atkins   PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iship, MATSEQAIJHIPSPARSE, MATMPIAIJHIPSPARSE, ""));
820ea9ee2c1SPierre Jolivet   PetscHYPREInitialize();
821c1a070e6SStefano Zampini   if (ismpiaij) {
822f4f49eeaSPierre Jolivet     Mat_MPIAIJ *a = (Mat_MPIAIJ *)A->data;
823c1a070e6SStefano Zampini 
824c1a070e6SStefano Zampini     diag = (Mat_SeqAIJ *)a->A->data;
825c1a070e6SStefano Zampini     offd = (Mat_SeqAIJ *)a->B->data;
82606977982Sstefanozampini     if (!boundtocpu && (iscuda || iship)) {
82706977982Sstefanozampini #if defined(HYPRE_USING_CUDA) && defined(PETSC_HAVE_CUDA)
82806977982Sstefanozampini       if (iscuda) {
8296ea7df73SStefano Zampini         sameint = PETSC_TRUE;
8309566063dSJacob Faibussowitsch         PetscCall(MatSeqAIJCUSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
8319566063dSJacob Faibussowitsch         PetscCall(MatSeqAIJCUSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj));
83206977982Sstefanozampini       }
8336ea7df73SStefano Zampini #endif
83406977982Sstefanozampini #if defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP)
83506977982Sstefanozampini       if (iship) {
83606977982Sstefanozampini         sameint = PETSC_TRUE;
83706977982Sstefanozampini         PetscCall(MatSeqAIJHIPSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
83806977982Sstefanozampini         PetscCall(MatSeqAIJHIPSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj));
83906977982Sstefanozampini       }
84006977982Sstefanozampini #endif
84106977982Sstefanozampini     } else {
84206977982Sstefanozampini       boundtocpu = PETSC_TRUE;
8436ea7df73SStefano Zampini       pdi        = diag->i;
8446ea7df73SStefano Zampini       pdj        = diag->j;
8456ea7df73SStefano Zampini       poi        = offd->i;
8466ea7df73SStefano Zampini       poj        = offd->j;
8476ea7df73SStefano Zampini       if (sameint) {
8486ea7df73SStefano Zampini         hdi = (HYPRE_Int *)pdi;
8496ea7df73SStefano Zampini         hdj = (HYPRE_Int *)pdj;
8506ea7df73SStefano Zampini         hoi = (HYPRE_Int *)poi;
8516ea7df73SStefano Zampini         hoj = (HYPRE_Int *)poj;
8526ea7df73SStefano Zampini       }
8536ea7df73SStefano Zampini     }
854c1a070e6SStefano Zampini     garray = a->garray;
855c1a070e6SStefano Zampini     noffd  = a->B->cmap->N;
856c1a070e6SStefano Zampini     dnnz   = diag->nz;
857c1a070e6SStefano Zampini     onnz   = offd->nz;
858c1a070e6SStefano Zampini   } else {
859c1a070e6SStefano Zampini     diag = (Mat_SeqAIJ *)A->data;
860c1a070e6SStefano Zampini     offd = NULL;
86106977982Sstefanozampini     if (!boundtocpu && (iscuda || iship)) {
86206977982Sstefanozampini #if defined(HYPRE_USING_CUDA) && defined(PETSC_HAVE_CUDA)
86306977982Sstefanozampini       if (iscuda) {
8646ea7df73SStefano Zampini         sameint = PETSC_TRUE;
8659566063dSJacob Faibussowitsch         PetscCall(MatSeqAIJCUSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
86606977982Sstefanozampini       }
8676ea7df73SStefano Zampini #endif
86806977982Sstefanozampini #if defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP)
86906977982Sstefanozampini       if (iship) {
87006977982Sstefanozampini         sameint = PETSC_TRUE;
87106977982Sstefanozampini         PetscCall(MatSeqAIJHIPSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
87206977982Sstefanozampini       }
87306977982Sstefanozampini #endif
87406977982Sstefanozampini     } else {
87506977982Sstefanozampini       boundtocpu = PETSC_TRUE;
8766ea7df73SStefano Zampini       pdi        = diag->i;
8776ea7df73SStefano Zampini       pdj        = diag->j;
8786ea7df73SStefano Zampini       if (sameint) {
8796ea7df73SStefano Zampini         hdi = (HYPRE_Int *)pdi;
8806ea7df73SStefano Zampini         hdj = (HYPRE_Int *)pdj;
8816ea7df73SStefano Zampini       }
8826ea7df73SStefano Zampini     }
883c1a070e6SStefano Zampini     garray = NULL;
884c1a070e6SStefano Zampini     noffd  = 0;
885c1a070e6SStefano Zampini     dnnz   = diag->nz;
886c1a070e6SStefano Zampini     onnz   = 0;
887c1a070e6SStefano Zampini   }
888225daaf8SStefano Zampini 
889c1a070e6SStefano Zampini   /* create a temporary ParCSR */
890c1a070e6SStefano Zampini   if (HYPRE_AssumedPartitionCheck()) {
891c1a070e6SStefano Zampini     PetscMPIInt myid;
892c1a070e6SStefano Zampini 
8939566063dSJacob Faibussowitsch     PetscCallMPI(MPI_Comm_rank(comm, &myid));
894c1a070e6SStefano Zampini     row_starts = A->rmap->range + myid;
895c1a070e6SStefano Zampini     col_starts = A->cmap->range + myid;
896c1a070e6SStefano Zampini   } else {
897c1a070e6SStefano Zampini     row_starts = A->rmap->range;
898c1a070e6SStefano Zampini     col_starts = A->cmap->range;
899c1a070e6SStefano Zampini   }
900*f2f41e48SZach Atkins   tA = hypre_ParCSRMatrixCreate(comm, A->rmap->N, A->cmap->N, (HYPRE_BigInt *)row_starts, (HYPRE_BigInt *)col_starts, (HYPRE_Int)noffd, (HYPRE_Int)dnnz, (HYPRE_Int)onnz);
901a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
902c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetRowStartsOwner(tA, 0);
903c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetColStartsOwner(tA, 0);
904a1d2239cSSatish Balay #endif
905c1a070e6SStefano Zampini 
906225daaf8SStefano Zampini   /* set diagonal part */
907c1a070e6SStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(tA);
9086ea7df73SStefano Zampini   if (!sameint) { /* malloc CSR pointers */
9099566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(A->rmap->n + 1, &hdi, dnnz, &hdj));
910f4f49eeaSPierre Jolivet     for (i = 0; i < A->rmap->n + 1; i++) hdi[i] = (HYPRE_Int)pdi[i];
911f4f49eeaSPierre Jolivet     for (i = 0; i < dnnz; i++) hdj[i] = (HYPRE_Int)pdj[i];
9122cf14000SStefano Zampini   }
9136ea7df73SStefano Zampini   hypre_CSRMatrixI(hdiag)           = hdi;
9146ea7df73SStefano Zampini   hypre_CSRMatrixJ(hdiag)           = hdj;
91539accc25SStefano Zampini   hypre_CSRMatrixData(hdiag)        = (HYPRE_Complex *)diag->a;
916*f2f41e48SZach Atkins   hypre_CSRMatrixNumNonzeros(hdiag) = (HYPRE_Int)diag->nz;
917c1a070e6SStefano Zampini   hypre_CSRMatrixSetDataOwner(hdiag, 0);
918c1a070e6SStefano Zampini 
9194cf0e950SBarry Smith   /* set off-diagonal part */
920c1a070e6SStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(tA);
921c1a070e6SStefano Zampini   if (offd) {
9226ea7df73SStefano Zampini     if (!sameint) { /* malloc CSR pointers */
9239566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(A->rmap->n + 1, &hoi, onnz, &hoj));
924f4f49eeaSPierre Jolivet       for (i = 0; i < A->rmap->n + 1; i++) hoi[i] = (HYPRE_Int)poi[i];
925f4f49eeaSPierre Jolivet       for (i = 0; i < onnz; i++) hoj[i] = (HYPRE_Int)poj[i];
9262cf14000SStefano Zampini     }
9276ea7df73SStefano Zampini     hypre_CSRMatrixI(hoffd)           = hoi;
9286ea7df73SStefano Zampini     hypre_CSRMatrixJ(hoffd)           = hoj;
92939accc25SStefano Zampini     hypre_CSRMatrixData(hoffd)        = (HYPRE_Complex *)offd->a;
930*f2f41e48SZach Atkins     hypre_CSRMatrixNumNonzeros(hoffd) = (HYPRE_Int)offd->nz;
931c1a070e6SStefano Zampini     hypre_CSRMatrixSetDataOwner(hoffd, 0);
9326ea7df73SStefano Zampini   }
9336ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
934a333fa2bSZach Atkins   PetscCallHYPRE(hypre_ParCSRMatrixInitialize_v2(tA, !boundtocpu ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST));
9356ea7df73SStefano Zampini #else
9366ea7df73SStefano Zampini   #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
937a333fa2bSZach Atkins   PetscCallHYPRE(hypre_ParCSRMatrixInitialize(tA));
9386ea7df73SStefano Zampini   #else
939a333fa2bSZach Atkins   PetscCallHYPRE(hypre_ParCSRMatrixInitialize_v2(tA, HYPRE_MEMORY_HOST));
9406ea7df73SStefano Zampini   #endif
9416ea7df73SStefano Zampini #endif
942bb16242fSVictor A. P. Magri 
943bb16242fSVictor A. P. Magri   /* MatrixSetRownnz comes after MatrixInitialize, so the first uses the right memory location */
944bb16242fSVictor A. P. Magri   hypre_CSRMatrixSetRownnz(hdiag);
945bb16242fSVictor A. P. Magri   if (offd) hypre_CSRMatrixSetRownnz(hoffd);
946bb16242fSVictor A. P. Magri 
9476ea7df73SStefano Zampini   hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA), HYPRE_MEMORY_HOST);
948c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetNumNonzeros(tA);
9492cf14000SStefano Zampini   hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt *)garray;
950a333fa2bSZach Atkins   if (!hypre_ParCSRMatrixCommPkg(tA)) PetscCallHYPRE(hypre_MatvecCommPkgCreate(tA));
951613e5ff0Sstefano_zampini   *hA = tA;
9523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
953613e5ff0Sstefano_zampini }
954c1a070e6SStefano Zampini 
955d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA)
956d71ae5a4SJacob Faibussowitsch {
957613e5ff0Sstefano_zampini   hypre_CSRMatrix *hdiag, *hoffd;
9586ea7df73SStefano Zampini   PetscBool        ismpiaij, sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
959b655ebf8SZach Atkins   PetscBool        iscuda, iship;
960c1a070e6SStefano Zampini 
961613e5ff0Sstefano_zampini   PetscFunctionBegin;
9629566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij));
9639566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, ""));
964b655ebf8SZach Atkins   PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iship, MATSEQAIJHIPSPARSE, MATMPIAIJHIPSPARSE, ""));
965b655ebf8SZach Atkins #if defined(HYPRE_USING_CUDA) && defined(PETSC_HAVE_CUDA)
9666ea7df73SStefano Zampini   if (iscuda) sameint = PETSC_TRUE;
967b655ebf8SZach Atkins #elif defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP)
968b655ebf8SZach Atkins   if (iship) sameint = PETSC_TRUE;
9696ea7df73SStefano Zampini #endif
970613e5ff0Sstefano_zampini   hdiag = hypre_ParCSRMatrixDiag(*hA);
971613e5ff0Sstefano_zampini   hoffd = hypre_ParCSRMatrixOffd(*hA);
9726ea7df73SStefano Zampini   /* free temporary memory allocated by PETSc
9736ea7df73SStefano Zampini      set pointers to NULL before destroying tA */
9742cf14000SStefano Zampini   if (!sameint) {
9752cf14000SStefano Zampini     HYPRE_Int *hi, *hj;
9762cf14000SStefano Zampini 
9772cf14000SStefano Zampini     hi = hypre_CSRMatrixI(hdiag);
9782cf14000SStefano Zampini     hj = hypre_CSRMatrixJ(hdiag);
9799566063dSJacob Faibussowitsch     PetscCall(PetscFree2(hi, hj));
9806ea7df73SStefano Zampini     if (ismpiaij) {
9812cf14000SStefano Zampini       hi = hypre_CSRMatrixI(hoffd);
9822cf14000SStefano Zampini       hj = hypre_CSRMatrixJ(hoffd);
9839566063dSJacob Faibussowitsch       PetscCall(PetscFree2(hi, hj));
9842cf14000SStefano Zampini     }
9852cf14000SStefano Zampini   }
986c1a070e6SStefano Zampini   hypre_CSRMatrixI(hdiag)    = NULL;
987c1a070e6SStefano Zampini   hypre_CSRMatrixJ(hdiag)    = NULL;
988c1a070e6SStefano Zampini   hypre_CSRMatrixData(hdiag) = NULL;
9896ea7df73SStefano Zampini   if (ismpiaij) {
990c1a070e6SStefano Zampini     hypre_CSRMatrixI(hoffd)    = NULL;
991c1a070e6SStefano Zampini     hypre_CSRMatrixJ(hoffd)    = NULL;
992c1a070e6SStefano Zampini     hypre_CSRMatrixData(hoffd) = NULL;
9936ea7df73SStefano Zampini   }
994613e5ff0Sstefano_zampini   hypre_ParCSRMatrixColMapOffd(*hA) = NULL;
995613e5ff0Sstefano_zampini   hypre_ParCSRMatrixDestroy(*hA);
996613e5ff0Sstefano_zampini   *hA = NULL;
9973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
998613e5ff0Sstefano_zampini }
999613e5ff0Sstefano_zampini 
1000613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG:
10013dad0653Sstefano_zampini    the resulting ParCSR will not own the column and row starts
10026ea7df73SStefano Zampini    It looks like we don't need to have the diagonal entries ordered first */
1003d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP)
1004d71ae5a4SJacob Faibussowitsch {
1005a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
1006613e5ff0Sstefano_zampini   HYPRE_Int P_owns_col_starts, R_owns_row_starts;
1007a1d2239cSSatish Balay #endif
1008613e5ff0Sstefano_zampini 
1009613e5ff0Sstefano_zampini   PetscFunctionBegin;
1010a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
1011613e5ff0Sstefano_zampini   P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP);
1012613e5ff0Sstefano_zampini   R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR);
1013a1d2239cSSatish Balay #endif
10146ea7df73SStefano Zampini   /* can be replaced by version test later */
10156ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
1016792fecdfSBarry Smith   PetscStackPushExternal("hypre_ParCSRMatrixRAP");
10176ea7df73SStefano Zampini   *hRAP = hypre_ParCSRMatrixRAP(hR, hA, hP);
10186ea7df73SStefano Zampini   PetscStackPop;
10196ea7df73SStefano Zampini #else
1020a333fa2bSZach Atkins   PetscCallHYPRE(hypre_BoomerAMGBuildCoarseOperator(hR, hA, hP, hRAP));
1021a333fa2bSZach Atkins   PetscCallHYPRE(hypre_ParCSRMatrixSetNumNonzeros(*hRAP));
10226ea7df73SStefano Zampini #endif
1023613e5ff0Sstefano_zampini   /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */
1024a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
1025613e5ff0Sstefano_zampini   hypre_ParCSRMatrixSetRowStartsOwner(*hRAP, 0);
1026613e5ff0Sstefano_zampini   hypre_ParCSRMatrixSetColStartsOwner(*hRAP, 0);
1027613e5ff0Sstefano_zampini   if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP, 1);
1028613e5ff0Sstefano_zampini   if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR, 1);
1029a1d2239cSSatish Balay #endif
10303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1031613e5ff0Sstefano_zampini }
1032613e5ff0Sstefano_zampini 
1033d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat P, Mat C)
1034d71ae5a4SJacob Faibussowitsch {
10356f231fbdSstefano_zampini   Mat                 B;
10366abb4441SStefano Zampini   hypre_ParCSRMatrix *hA, *hP, *hPtAP = NULL;
10374222ddf1SHong Zhang   Mat_Product        *product = C->product;
1038613e5ff0Sstefano_zampini 
1039613e5ff0Sstefano_zampini   PetscFunctionBegin;
10409566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A, &hA));
10419566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(P, &hP));
10429566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(hP, hA, hP, &hPtAP));
10439566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hPtAP, MATAIJ, PETSC_OWN_POINTER, &B));
10444222ddf1SHong Zhang 
10459566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C, &B));
10464222ddf1SHong Zhang   C->product = product;
10474222ddf1SHong Zhang 
10489566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
10499566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(P, &hP));
10503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
10516f231fbdSstefano_zampini }
10526f231fbdSstefano_zampini 
1053d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat P, PetscReal fill, Mat C)
1054d71ae5a4SJacob Faibussowitsch {
10556f231fbdSstefano_zampini   PetscFunctionBegin;
10569566063dSJacob Faibussowitsch   PetscCall(MatSetType(C, MATAIJ));
10574222ddf1SHong Zhang   C->ops->ptapnumeric    = MatPtAPNumeric_AIJ_AIJ_wHYPRE;
10584222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_PtAP;
10593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1060613e5ff0Sstefano_zampini }
1061613e5ff0Sstefano_zampini 
1062d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A, Mat P, Mat C)
1063d71ae5a4SJacob Faibussowitsch {
10644cc28894Sstefano_zampini   Mat                 B;
10654cc28894Sstefano_zampini   Mat_HYPRE          *hP;
10666abb4441SStefano Zampini   hypre_ParCSRMatrix *hA = NULL, *Pparcsr, *ptapparcsr = NULL;
1067613e5ff0Sstefano_zampini   HYPRE_Int           type;
1068613e5ff0Sstefano_zampini   MPI_Comm            comm = PetscObjectComm((PetscObject)A);
10694cc28894Sstefano_zampini   PetscBool           ishypre;
1070613e5ff0Sstefano_zampini 
1071613e5ff0Sstefano_zampini   PetscFunctionBegin;
10729566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre));
107328b400f6SJacob Faibussowitsch   PetscCheck(ishypre, comm, PETSC_ERR_USER, "P should be of type %s", MATHYPRE);
10744cc28894Sstefano_zampini   hP = (Mat_HYPRE *)P->data;
1075a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hP->ij, &type));
107608401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1077a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(hP->ij, (void **)&Pparcsr));
1078613e5ff0Sstefano_zampini 
10799566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A, &hA));
10809566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, hA, Pparcsr, &ptapparcsr));
10819566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
1082225daaf8SStefano Zampini 
10834cc28894Sstefano_zampini   /* create temporary matrix and merge to C */
10849566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ptapparcsr, ((PetscObject)C)->type_name, PETSC_OWN_POINTER, &B));
10859566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C, &B));
10863ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
10874cc28894Sstefano_zampini }
10884cc28894Sstefano_zampini 
1089d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A, Mat P, Mat C)
1090d71ae5a4SJacob Faibussowitsch {
10914cc28894Sstefano_zampini   Mat                 B;
10926abb4441SStefano Zampini   hypre_ParCSRMatrix *Aparcsr, *Pparcsr, *ptapparcsr = NULL;
10934cc28894Sstefano_zampini   Mat_HYPRE          *hA, *hP;
10944cc28894Sstefano_zampini   PetscBool           ishypre;
10954cc28894Sstefano_zampini   HYPRE_Int           type;
10964cc28894Sstefano_zampini 
10974cc28894Sstefano_zampini   PetscFunctionBegin;
10989566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre));
109928b400f6SJacob Faibussowitsch   PetscCheck(ishypre, PetscObjectComm((PetscObject)P), PETSC_ERR_USER, "P should be of type %s", MATHYPRE);
11009566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre));
110128b400f6SJacob Faibussowitsch   PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE);
11024cc28894Sstefano_zampini   hA = (Mat_HYPRE *)A->data;
11034cc28894Sstefano_zampini   hP = (Mat_HYPRE *)P->data;
1104a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type));
110508401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1106a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hP->ij, &type));
110708401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)P), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1108a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&Aparcsr));
1109a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(hP->ij, (void **)&Pparcsr));
11109566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, Aparcsr, Pparcsr, &ptapparcsr));
11119566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ptapparcsr, MATHYPRE, PETSC_OWN_POINTER, &B));
11129566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C, &B));
11133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
11144cc28894Sstefano_zampini }
11154cc28894Sstefano_zampini 
1116d501dc42Sstefano_zampini /* calls hypre_ParMatmul
1117d501dc42Sstefano_zampini    hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA
11183dad0653Sstefano_zampini    hypre_ParMatrixCreate does not duplicate the communicator
11196ea7df73SStefano Zampini    It looks like we don't need to have the diagonal entries ordered first */
1120d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB)
1121d71ae5a4SJacob Faibussowitsch {
1122d501dc42Sstefano_zampini   PetscFunctionBegin;
11236ea7df73SStefano Zampini   /* can be replaced by version test later */
11246ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
1125792fecdfSBarry Smith   PetscStackPushExternal("hypre_ParCSRMatMat");
11266ea7df73SStefano Zampini   *hAB = hypre_ParCSRMatMat(hA, hB);
11276ea7df73SStefano Zampini #else
1128792fecdfSBarry Smith   PetscStackPushExternal("hypre_ParMatmul");
1129d501dc42Sstefano_zampini   *hAB = hypre_ParMatmul(hA, hB);
11306ea7df73SStefano Zampini #endif
1131d501dc42Sstefano_zampini   PetscStackPop;
11323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1133d501dc42Sstefano_zampini }
1134d501dc42Sstefano_zampini 
1135d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C)
1136d71ae5a4SJacob Faibussowitsch {
11375e5acdf2Sstefano_zampini   Mat                 D;
1138d501dc42Sstefano_zampini   hypre_ParCSRMatrix *hA, *hB, *hAB = NULL;
11394222ddf1SHong Zhang   Mat_Product        *product = C->product;
11405e5acdf2Sstefano_zampini 
11415e5acdf2Sstefano_zampini   PetscFunctionBegin;
11429566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A, &hA));
11439566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(B, &hB));
11449566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_MatMatMult(hA, hB, &hAB));
11459566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hAB, MATAIJ, PETSC_OWN_POINTER, &D));
11464222ddf1SHong Zhang 
11479566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C, &D));
11484222ddf1SHong Zhang   C->product = product;
11494222ddf1SHong Zhang 
11509566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
11519566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(B, &hB));
11523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
11535e5acdf2Sstefano_zampini }
11545e5acdf2Sstefano_zampini 
1155d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat B, PetscReal fill, Mat C)
1156d71ae5a4SJacob Faibussowitsch {
11575e5acdf2Sstefano_zampini   PetscFunctionBegin;
11589566063dSJacob Faibussowitsch   PetscCall(MatSetType(C, MATAIJ));
11594222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE;
11604222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
11613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
11625e5acdf2Sstefano_zampini }
11635e5acdf2Sstefano_zampini 
1164d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A, Mat B, Mat C)
1165d71ae5a4SJacob Faibussowitsch {
1166d501dc42Sstefano_zampini   Mat                 D;
1167d501dc42Sstefano_zampini   hypre_ParCSRMatrix *Aparcsr, *Bparcsr, *ABparcsr = NULL;
1168d501dc42Sstefano_zampini   Mat_HYPRE          *hA, *hB;
1169d501dc42Sstefano_zampini   PetscBool           ishypre;
1170d501dc42Sstefano_zampini   HYPRE_Int           type;
11714222ddf1SHong Zhang   Mat_Product        *product;
1172d501dc42Sstefano_zampini 
1173d501dc42Sstefano_zampini   PetscFunctionBegin;
11749566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHYPRE, &ishypre));
117528b400f6SJacob Faibussowitsch   PetscCheck(ishypre, PetscObjectComm((PetscObject)B), PETSC_ERR_USER, "B should be of type %s", MATHYPRE);
11769566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre));
117728b400f6SJacob Faibussowitsch   PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE);
1178d501dc42Sstefano_zampini   hA = (Mat_HYPRE *)A->data;
1179d501dc42Sstefano_zampini   hB = (Mat_HYPRE *)B->data;
1180a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type));
118108401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1182a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hB->ij, &type));
118308401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1184a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&Aparcsr));
1185a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(hB->ij, (void **)&Bparcsr));
11869566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_MatMatMult(Aparcsr, Bparcsr, &ABparcsr));
11879566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ABparcsr, MATHYPRE, PETSC_OWN_POINTER, &D));
11884222ddf1SHong Zhang 
1189d501dc42Sstefano_zampini   /* need to use HeaderReplace because HeaderMerge messes up with the communicator */
11904222ddf1SHong Zhang   product    = C->product; /* save it from MatHeaderReplace() */
11914222ddf1SHong Zhang   C->product = NULL;
11929566063dSJacob Faibussowitsch   PetscCall(MatHeaderReplace(C, &D));
11934222ddf1SHong Zhang   C->product             = product;
1194d501dc42Sstefano_zampini   C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE;
11954222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
11963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1197d501dc42Sstefano_zampini }
1198d501dc42Sstefano_zampini 
1199d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, Mat D)
1200d71ae5a4SJacob Faibussowitsch {
120120e1dc0dSstefano_zampini   Mat                 E;
12026abb4441SStefano Zampini   hypre_ParCSRMatrix *hA, *hB, *hC, *hABC = NULL;
120320e1dc0dSstefano_zampini 
120420e1dc0dSstefano_zampini   PetscFunctionBegin;
12059566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A, &hA));
12069566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(B, &hB));
12079566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(C, &hC));
12089566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(hA, hB, hC, &hABC));
12099566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hABC, MATAIJ, PETSC_OWN_POINTER, &E));
12109566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(D, &E));
12119566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
12129566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(B, &hB));
12139566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(C, &hC));
12143ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
121520e1dc0dSstefano_zampini }
121620e1dc0dSstefano_zampini 
1217d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, PetscReal fill, Mat D)
1218d71ae5a4SJacob Faibussowitsch {
121920e1dc0dSstefano_zampini   PetscFunctionBegin;
12209566063dSJacob Faibussowitsch   PetscCall(MatSetType(D, MATAIJ));
12213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
122220e1dc0dSstefano_zampini }
122320e1dc0dSstefano_zampini 
1224d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C)
1225d71ae5a4SJacob Faibussowitsch {
12264222ddf1SHong Zhang   PetscFunctionBegin;
12274222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
12283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
12294222ddf1SHong Zhang }
12304222ddf1SHong Zhang 
1231d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C)
1232d71ae5a4SJacob Faibussowitsch {
12334222ddf1SHong Zhang   Mat_Product *product = C->product;
12344222ddf1SHong Zhang   PetscBool    Ahypre;
12354222ddf1SHong Zhang 
12364222ddf1SHong Zhang   PetscFunctionBegin;
12379566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)product->A, MATHYPRE, &Ahypre));
12384222ddf1SHong Zhang   if (Ahypre) { /* A is a Hypre matrix */
12399566063dSJacob Faibussowitsch     PetscCall(MatSetType(C, MATHYPRE));
12404222ddf1SHong Zhang     C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE;
12414222ddf1SHong Zhang     C->ops->matmultnumeric  = MatMatMultNumeric_HYPRE_HYPRE;
12423ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
12436718818eSStefano Zampini   }
12443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
12454222ddf1SHong Zhang }
12464222ddf1SHong Zhang 
1247d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C)
1248d71ae5a4SJacob Faibussowitsch {
12494222ddf1SHong Zhang   PetscFunctionBegin;
12504222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_PtAP;
12513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
12524222ddf1SHong Zhang }
12534222ddf1SHong Zhang 
1254d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C)
1255d71ae5a4SJacob Faibussowitsch {
12564222ddf1SHong Zhang   Mat_Product *product = C->product;
12574222ddf1SHong Zhang   PetscBool    flg;
12584222ddf1SHong Zhang   PetscInt     type        = 0;
12594222ddf1SHong Zhang   const char  *outTypes[4] = {"aij", "seqaij", "mpiaij", "hypre"};
12604222ddf1SHong Zhang   PetscInt     ntype       = 4;
12614222ddf1SHong Zhang   Mat          A           = product->A;
12624222ddf1SHong Zhang   PetscBool    Ahypre;
12634222ddf1SHong Zhang 
12644222ddf1SHong Zhang   PetscFunctionBegin;
12659566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &Ahypre));
12664222ddf1SHong Zhang   if (Ahypre) { /* A is a Hypre matrix */
12679566063dSJacob Faibussowitsch     PetscCall(MatSetType(C, MATHYPRE));
12684222ddf1SHong Zhang     C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE;
12694222ddf1SHong Zhang     C->ops->ptapnumeric     = MatPtAPNumeric_HYPRE_HYPRE;
12703ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
12714222ddf1SHong Zhang   }
12724222ddf1SHong Zhang 
12734222ddf1SHong Zhang   /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */
12744222ddf1SHong Zhang   /* Get runtime option */
12754222ddf1SHong Zhang   if (product->api_user) {
1276d0609cedSBarry Smith     PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatPtAP_HYPRE", "Mat");
12779566063dSJacob Faibussowitsch     PetscCall(PetscOptionsEList("-matptap_hypre_outtype", "MatPtAP outtype", "MatPtAP outtype", outTypes, ntype, outTypes[type], &type, &flg));
1278d0609cedSBarry Smith     PetscOptionsEnd();
12794222ddf1SHong Zhang   } else {
1280d0609cedSBarry Smith     PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatProduct_PtAP_HYPRE", "Mat");
12819566063dSJacob Faibussowitsch     PetscCall(PetscOptionsEList("-mat_product_algorithm_hypre_outtype", "MatProduct_PtAP outtype", "MatProduct_PtAP", outTypes, ntype, outTypes[type], &type, &flg));
1282d0609cedSBarry Smith     PetscOptionsEnd();
12834222ddf1SHong Zhang   }
12844222ddf1SHong Zhang 
12854222ddf1SHong Zhang   if (type == 0 || type == 1 || type == 2) {
12869566063dSJacob Faibussowitsch     PetscCall(MatSetType(C, MATAIJ));
12874222ddf1SHong Zhang   } else if (type == 3) {
12889566063dSJacob Faibussowitsch     PetscCall(MatSetType(C, MATHYPRE));
12894222ddf1SHong Zhang   } else SETERRQ(PetscObjectComm((PetscObject)C), PETSC_ERR_SUP, "MatPtAP outtype is not supported");
12904222ddf1SHong Zhang   C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE;
12914222ddf1SHong Zhang   C->ops->ptapnumeric     = MatPtAPNumeric_AIJ_HYPRE;
12923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
12934222ddf1SHong Zhang }
12944222ddf1SHong Zhang 
1295d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C)
1296d71ae5a4SJacob Faibussowitsch {
12974222ddf1SHong Zhang   Mat_Product *product = C->product;
12984222ddf1SHong Zhang 
12994222ddf1SHong Zhang   PetscFunctionBegin;
13004222ddf1SHong Zhang   switch (product->type) {
1301d71ae5a4SJacob Faibussowitsch   case MATPRODUCT_AB:
1302d71ae5a4SJacob Faibussowitsch     PetscCall(MatProductSetFromOptions_HYPRE_AB(C));
1303d71ae5a4SJacob Faibussowitsch     break;
1304d71ae5a4SJacob Faibussowitsch   case MATPRODUCT_PtAP:
1305d71ae5a4SJacob Faibussowitsch     PetscCall(MatProductSetFromOptions_HYPRE_PtAP(C));
1306d71ae5a4SJacob Faibussowitsch     break;
1307d71ae5a4SJacob Faibussowitsch   default:
1308d71ae5a4SJacob Faibussowitsch     break;
13094222ddf1SHong Zhang   }
13103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
13114222ddf1SHong Zhang }
13124222ddf1SHong Zhang 
1313d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y)
1314d71ae5a4SJacob Faibussowitsch {
131563c07aadSStefano Zampini   PetscFunctionBegin;
13169566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_TRUE));
13173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
131863c07aadSStefano Zampini }
131963c07aadSStefano Zampini 
1320d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y)
1321d71ae5a4SJacob Faibussowitsch {
132263c07aadSStefano Zampini   PetscFunctionBegin;
13239566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_FALSE));
13243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
132563c07aadSStefano Zampini }
132663c07aadSStefano Zampini 
1327d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z)
1328d71ae5a4SJacob Faibussowitsch {
1329414bd5c3SStefano Zampini   PetscFunctionBegin;
133048a46eb9SPierre Jolivet   if (y != z) PetscCall(VecCopy(y, z));
13319566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_FALSE));
13323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1333414bd5c3SStefano Zampini }
1334414bd5c3SStefano Zampini 
1335d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z)
1336d71ae5a4SJacob Faibussowitsch {
1337414bd5c3SStefano Zampini   PetscFunctionBegin;
133848a46eb9SPierre Jolivet   if (y != z) PetscCall(VecCopy(y, z));
13399566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_TRUE));
13403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1341414bd5c3SStefano Zampini }
1342414bd5c3SStefano Zampini 
1343414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */
1344d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans)
1345d71ae5a4SJacob Faibussowitsch {
134663c07aadSStefano Zampini   Mat_HYPRE          *hA = (Mat_HYPRE *)A->data;
134763c07aadSStefano Zampini   hypre_ParCSRMatrix *parcsr;
134863c07aadSStefano Zampini   hypre_ParVector    *hx, *hy;
134963c07aadSStefano Zampini 
135063c07aadSStefano Zampini   PetscFunctionBegin;
135163c07aadSStefano Zampini   if (trans) {
13529566063dSJacob Faibussowitsch     PetscCall(VecHYPRE_IJVectorPushVecRead(hA->b, x));
13539566063dSJacob Faibussowitsch     if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->x, y));
13549566063dSJacob Faibussowitsch     else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->x, y));
1355a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->b->ij, (void **)&hx));
1356a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->x->ij, (void **)&hy));
135763c07aadSStefano Zampini   } else {
13589566063dSJacob Faibussowitsch     PetscCall(VecHYPRE_IJVectorPushVecRead(hA->x, x));
13599566063dSJacob Faibussowitsch     if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->b, y));
13609566063dSJacob Faibussowitsch     else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->b, y));
1361a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->x->ij, (void **)&hx));
1362a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->b->ij, (void **)&hy));
136363c07aadSStefano Zampini   }
1364a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr));
13656ea7df73SStefano Zampini   if (trans) {
1366a333fa2bSZach Atkins     PetscCallHYPRE(hypre_ParCSRMatrixMatvecT(a, parcsr, hx, b, hy));
13676ea7df73SStefano Zampini   } else {
1368a333fa2bSZach Atkins     PetscCallHYPRE(hypre_ParCSRMatrixMatvec(a, parcsr, hx, b, hy));
13696ea7df73SStefano Zampini   }
13709566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorPopVec(hA->x));
13719566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorPopVec(hA->b));
13723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
137363c07aadSStefano Zampini }
137463c07aadSStefano Zampini 
1375d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDestroy_HYPRE(Mat A)
1376d71ae5a4SJacob Faibussowitsch {
137763c07aadSStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
137863c07aadSStefano Zampini 
137963c07aadSStefano Zampini   PetscFunctionBegin;
13809566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorDestroy(&hA->x));
13819566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorDestroy(&hA->b));
138206977982Sstefanozampini   PetscCall(MatHYPRE_DestroyCOOMat(A)); /* must be called before destroying the individual CSR */
1383978814f1SStefano Zampini   if (hA->ij) {
1384978814f1SStefano Zampini     if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL;
1385a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixDestroy(hA->ij));
1386978814f1SStefano Zampini   }
13879566063dSJacob Faibussowitsch   if (hA->comm) PetscCall(PetscCommRestoreComm(PetscObjectComm((PetscObject)A), &hA->comm));
1388c69f721fSFande Kong 
13899566063dSJacob Faibussowitsch   PetscCall(MatStashDestroy_Private(&A->stash));
13909566063dSJacob Faibussowitsch   PetscCall(PetscFree(hA->array));
1391a32e9c99SJunchao Zhang   if (hA->rows_d) PetscStackCallExternalVoid("hypre_Free", hypre_Free(hA->rows_d, HYPRE_MEMORY_DEVICE));
1392c69f721fSFande Kong 
13939566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_aij_C", NULL));
13949566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_is_C", NULL));
13959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_hypre_C", NULL));
13969566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaij_hypre_C", NULL));
139706977982Sstefanozampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_hypre_C", NULL));
139806977982Sstefanozampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaijhipsparse_hypre_C", NULL));
139906977982Sstefanozampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_hypre_C", NULL));
140006977982Sstefanozampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaijcusparse_hypre_C", NULL));
14019566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPRESetPreallocation_C", NULL));
14029566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPREGetParCSR_C", NULL));
14035fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
14045fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
14059566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
14063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
140763c07aadSStefano Zampini }
140863c07aadSStefano Zampini 
1409d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetUp_HYPRE(Mat A)
1410d71ae5a4SJacob Faibussowitsch {
14114ec6421dSstefano_zampini   PetscFunctionBegin;
141206977982Sstefanozampini   if (!A->preallocated) PetscCall(MatHYPRESetPreallocation(A, PETSC_DEFAULT, NULL, PETSC_DEFAULT, NULL));
14133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14144ec6421dSstefano_zampini }
14154ec6421dSstefano_zampini 
14166ea7df73SStefano Zampini //TODO FIX hypre_CSRMatrixMatvecOutOfPlace
#if defined(PETSC_HAVE_HYPRE_DEVICE)
/*
  MatBindToCPU_HYPRE - Records the requested binding on the Mat and migrates the hypre data accordingly

  bind == PETSC_TRUE selects HYPRE_MEMORY_HOST, otherwise HYPRE_MEMORY_DEVICE.
  The ParCSR object is migrated only when the IJ matrix exists, is flagged as assembled
  and currently reports a different memory location. The work vectors hA->x and hA->b,
  when present, are rebound too.
*/
static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind)
{
  Mat_HYPRE           *hA = (Mat_HYPRE *)A->data;
  HYPRE_MemoryLocation target;

  PetscFunctionBegin;
  target        = bind ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE;
  A->boundtocpu = bind;
  if (hA->ij && hypre_IJMatrixAssembleFlag(hA->ij) && hypre_IJMatrixMemoryLocation(hA->ij) != target) {
    hypre_ParCSRMatrix *csr;

    PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&csr));
    PetscCallHYPRE(hypre_ParCSRMatrixMigrate(csr, target));
  }
  if (hA->x) PetscCall(VecHYPRE_IJBindToCPU(hA->x, bind));
  if (hA->b) PetscCall(VecHYPRE_IJBindToCPU(hA->b, bind));
  PetscFunctionReturn(PETSC_SUCCESS);
}
#endif
14356ea7df73SStefano Zampini 
1436d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode)
1437d71ae5a4SJacob Faibussowitsch {
143863c07aadSStefano Zampini   Mat_HYPRE   *hA = (Mat_HYPRE *)A->data;
1439c69f721fSFande Kong   PetscMPIInt  n;
1440c69f721fSFande Kong   PetscInt     i, j, rstart, ncols, flg;
1441c69f721fSFande Kong   PetscInt    *row, *col;
1442c69f721fSFande Kong   PetscScalar *val;
144363c07aadSStefano Zampini 
144463c07aadSStefano Zampini   PetscFunctionBegin;
144508401ef6SPierre Jolivet   PetscCheck(mode != MAT_FLUSH_ASSEMBLY, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE");
1446c69f721fSFande Kong 
1447c69f721fSFande Kong   if (!A->nooffprocentries) {
1448c69f721fSFande Kong     while (1) {
14499566063dSJacob Faibussowitsch       PetscCall(MatStashScatterGetMesg_Private(&A->stash, &n, &row, &col, &val, &flg));
1450c69f721fSFande Kong       if (!flg) break;
1451c69f721fSFande Kong 
1452c69f721fSFande Kong       for (i = 0; i < n;) {
1453c69f721fSFande Kong         /* Now identify the consecutive vals belonging to the same row */
1454c69f721fSFande Kong         for (j = i, rstart = row[j]; j < n; j++) {
1455c69f721fSFande Kong           if (row[j] != rstart) break;
1456c69f721fSFande Kong         }
1457c69f721fSFande Kong         if (j < n) ncols = j - i;
1458c69f721fSFande Kong         else ncols = n - i;
1459c69f721fSFande Kong         /* Now assemble all these values with a single function call */
14609566063dSJacob Faibussowitsch         PetscCall(MatSetValues_HYPRE(A, 1, row + i, ncols, col + i, val + i, A->insertmode));
1461c69f721fSFande Kong 
1462c69f721fSFande Kong         i = j;
1463c69f721fSFande Kong       }
1464c69f721fSFande Kong     }
14659566063dSJacob Faibussowitsch     PetscCall(MatStashScatterEnd_Private(&A->stash));
1466c69f721fSFande Kong   }
1467c69f721fSFande Kong 
1468a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixAssemble(hA->ij));
1469336664bdSPierre Jolivet   /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */
1470336664bdSPierre Jolivet   /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */
1471651b1cf9SStefano Zampini   if (!A->sortedfull) {
1472af1cf968SStefano Zampini     hypre_AuxParCSRMatrix *aux_matrix;
1473af1cf968SStefano Zampini 
1474af1cf968SStefano Zampini     /* call destroy just to make sure we do not leak anything */
1475af1cf968SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1476a333fa2bSZach Atkins     PetscCallHYPRE(hypre_AuxParCSRMatrixDestroy(aux_matrix));
1477af1cf968SStefano Zampini     hypre_IJMatrixTranslator(hA->ij) = NULL;
1478af1cf968SStefano Zampini 
1479af1cf968SStefano Zampini     /* Initialize with assembled flag -> it only recreates the aux_par_matrix */
1480a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij));
1481af1cf968SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
14826ea7df73SStefano Zampini     if (aux_matrix) {
1483af1cf968SStefano Zampini       hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see comment in MatHYPRESetPreallocation_HYPRE */
148422235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
1485a333fa2bSZach Atkins       PetscCallHYPRE(hypre_AuxParCSRMatrixInitialize(aux_matrix));
148622235d61SPierre Jolivet #else
1487a333fa2bSZach Atkins       PetscCallHYPRE(hypre_AuxParCSRMatrixInitialize_v2(aux_matrix, HYPRE_MEMORY_HOST));
148822235d61SPierre Jolivet #endif
1489af1cf968SStefano Zampini     }
14906ea7df73SStefano Zampini   }
14916ea7df73SStefano Zampini   {
14926ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
14936ea7df73SStefano Zampini 
1494a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr));
1495a333fa2bSZach Atkins     if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscCallHYPRE(hypre_MatvecCommPkgCreate(parcsr));
14966ea7df73SStefano Zampini   }
14979566063dSJacob Faibussowitsch   if (!hA->x) PetscCall(VecHYPRE_IJVectorCreate(A->cmap, &hA->x));
14989566063dSJacob Faibussowitsch   if (!hA->b) PetscCall(VecHYPRE_IJVectorCreate(A->rmap, &hA->b));
14996ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
15009566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU_HYPRE(A, A->boundtocpu));
15016ea7df73SStefano Zampini #endif
15023ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
150363c07aadSStefano Zampini }
150463c07aadSStefano Zampini 
1505d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array)
1506d71ae5a4SJacob Faibussowitsch {
1507c69f721fSFande Kong   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1508c69f721fSFande Kong 
1509c69f721fSFande Kong   PetscFunctionBegin;
1510651b1cf9SStefano Zampini   PetscCheck(hA->array_available, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Temporary space is in use");
1511c69f721fSFande Kong 
1512651b1cf9SStefano Zampini   if (hA->array_size >= size) {
151339accc25SStefano Zampini     *array = hA->array;
151439accc25SStefano Zampini   } else {
15159566063dSJacob Faibussowitsch     PetscCall(PetscFree(hA->array));
1516651b1cf9SStefano Zampini     hA->array_size = size;
1517651b1cf9SStefano Zampini     PetscCall(PetscMalloc(hA->array_size, &hA->array));
1518c69f721fSFande Kong     *array = hA->array;
1519c69f721fSFande Kong   }
1520c69f721fSFande Kong 
1521651b1cf9SStefano Zampini   hA->array_available = PETSC_FALSE;
15223ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1523c69f721fSFande Kong }
1524c69f721fSFande Kong 
1525d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array)
1526d71ae5a4SJacob Faibussowitsch {
1527c69f721fSFande Kong   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1528c69f721fSFande Kong 
1529c69f721fSFande Kong   PetscFunctionBegin;
1530c69f721fSFande Kong   *array              = NULL;
1531651b1cf9SStefano Zampini   hA->array_available = PETSC_TRUE;
15323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1533c69f721fSFande Kong }
1534c69f721fSFande Kong 
1535d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins)
1536d71ae5a4SJacob Faibussowitsch {
1537d975228cSstefano_zampini   Mat_HYPRE     *hA   = (Mat_HYPRE *)A->data;
1538d975228cSstefano_zampini   PetscScalar   *vals = (PetscScalar *)v;
153939accc25SStefano Zampini   HYPRE_Complex *sscr;
1540c69f721fSFande Kong   PetscInt      *cscr[2];
1541c69f721fSFande Kong   PetscInt       i, nzc;
1542651b1cf9SStefano Zampini   PetscInt       rst = A->rmap->rstart, ren = A->rmap->rend;
154308defe43SFande Kong   void          *array = NULL;
1544d975228cSstefano_zampini 
1545d975228cSstefano_zampini   PetscFunctionBegin;
15469566063dSJacob Faibussowitsch   PetscCall(MatGetArray_HYPRE(A, sizeof(PetscInt) * (2 * nc) + sizeof(HYPRE_Complex) * nc * nr, &array));
1547c69f721fSFande Kong   cscr[0] = (PetscInt *)array;
1548c69f721fSFande Kong   cscr[1] = ((PetscInt *)array) + nc;
154939accc25SStefano Zampini   sscr    = (HYPRE_Complex *)(((PetscInt *)array) + nc * 2);
1550d975228cSstefano_zampini   for (i = 0, nzc = 0; i < nc; i++) {
1551d975228cSstefano_zampini     if (cols[i] >= 0) {
1552d975228cSstefano_zampini       cscr[0][nzc]   = cols[i];
1553d975228cSstefano_zampini       cscr[1][nzc++] = i;
1554d975228cSstefano_zampini     }
1555d975228cSstefano_zampini   }
1556c69f721fSFande Kong   if (!nzc) {
15579566063dSJacob Faibussowitsch     PetscCall(MatRestoreArray_HYPRE(A, &array));
15583ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1559c69f721fSFande Kong   }
1560d975228cSstefano_zampini 
15616ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE)
15626ea7df73SStefano Zampini   if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) {
15636ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
15646ea7df73SStefano Zampini 
1565a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij,(void**)&parcsr));
1566a333fa2bSZach Atkins     PetscCallHYPRE(hypre_ParCSRMatrixMigrate(parcsr, HYPRE_MEMORY_HOST));
15676ea7df73SStefano Zampini   }
15686ea7df73SStefano Zampini #endif
15696ea7df73SStefano Zampini 
1570d975228cSstefano_zampini   if (ins == ADD_VALUES) {
1571d975228cSstefano_zampini     for (i = 0; i < nr; i++) {
15726ea7df73SStefano Zampini       if (rows[i] >= 0) {
1573d975228cSstefano_zampini         PetscInt  j;
15742cf14000SStefano Zampini         HYPRE_Int hnc = (HYPRE_Int)nzc;
15752cf14000SStefano Zampini 
1576651b1cf9SStefano Zampini         if (!nzc) continue;
1577651b1cf9SStefano Zampini         /* nonlocal values */
1578651b1cf9SStefano Zampini         if (rows[i] < rst || rows[i] >= ren) {
1579651b1cf9SStefano Zampini           PetscCheck(!A->nooffprocentries, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Setting off process row %" PetscInt_FMT " even though MatSetOption(,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE) was set", rows[i]);
1580651b1cf9SStefano Zampini           if (hA->donotstash) continue;
1581651b1cf9SStefano Zampini         }
1582aed4548fSBarry Smith         PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]);
15839566063dSJacob Faibussowitsch         for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j]));
1584a333fa2bSZach Atkins         PetscCallHYPRE(HYPRE_IJMatrixAddToValues(hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr));
1585d975228cSstefano_zampini       }
1586d975228cSstefano_zampini       vals += nc;
1587d975228cSstefano_zampini     }
1588d975228cSstefano_zampini   } else { /* INSERT_VALUES */
1589d975228cSstefano_zampini     for (i = 0; i < nr; i++) {
15906ea7df73SStefano Zampini       if (rows[i] >= 0) {
1591d975228cSstefano_zampini         PetscInt  j;
15922cf14000SStefano Zampini         HYPRE_Int hnc = (HYPRE_Int)nzc;
15932cf14000SStefano Zampini 
1594651b1cf9SStefano Zampini         if (!nzc) continue;
1595aed4548fSBarry Smith         PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]);
15969566063dSJacob Faibussowitsch         for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j]));
1597c69f721fSFande Kong         /* nonlocal values */
1598651b1cf9SStefano Zampini         if (rows[i] < rst || rows[i] >= ren) {
1599651b1cf9SStefano Zampini           PetscCheck(!A->nooffprocentries, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Setting off process row %" PetscInt_FMT " even though MatSetOption(,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE) was set", rows[i]);
1600651b1cf9SStefano Zampini           if (!hA->donotstash) PetscCall(MatStashValuesRow_Private(&A->stash, rows[i], nzc, cscr[0], (PetscScalar *)sscr, PETSC_FALSE));
1601651b1cf9SStefano Zampini         }
1602c69f721fSFande Kong         /* local values */
1603651b1cf9SStefano Zampini         else
1604a333fa2bSZach Atkins           PetscCallHYPRE(HYPRE_IJMatrixSetValues(hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr));
1605d975228cSstefano_zampini       }
1606d975228cSstefano_zampini       vals += nc;
1607d975228cSstefano_zampini     }
1608d975228cSstefano_zampini   }
1609c69f721fSFande Kong 
16109566063dSJacob Faibussowitsch   PetscCall(MatRestoreArray_HYPRE(A, &array));
16113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1612d975228cSstefano_zampini }
1613d975228cSstefano_zampini 
1614d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[])
1615d71ae5a4SJacob Faibussowitsch {
1616d975228cSstefano_zampini   Mat_HYPRE  *hA = (Mat_HYPRE *)A->data;
16177d968826Sstefano_zampini   HYPRE_Int  *hdnnz, *honnz;
161806a29025Sstefano_zampini   PetscInt    i, rs, re, cs, ce, bs;
1619d975228cSstefano_zampini   PetscMPIInt size;
1620d975228cSstefano_zampini 
1621d975228cSstefano_zampini   PetscFunctionBegin;
16229566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
16239566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
1624d975228cSstefano_zampini   rs = A->rmap->rstart;
1625d975228cSstefano_zampini   re = A->rmap->rend;
1626d975228cSstefano_zampini   cs = A->cmap->rstart;
1627d975228cSstefano_zampini   ce = A->cmap->rend;
1628d975228cSstefano_zampini   if (!hA->ij) {
1629a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rs, re - 1, cs, ce - 1, &hA->ij));
1630a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR));
1631d975228cSstefano_zampini   } else {
16322cf14000SStefano Zampini     HYPRE_BigInt hrs, hre, hcs, hce;
1633a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixGetLocalRange(hA->ij, &hrs, &hre, &hcs, &hce));
1634aed4548fSBarry Smith     PetscCheck(hre - hrs + 1 == re - rs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local rows: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hrs, hre + 1, rs, re);
1635aed4548fSBarry Smith     PetscCheck(hce - hcs + 1 == ce - cs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local cols: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hcs, hce + 1, cs, ce);
1636d975228cSstefano_zampini   }
163706977982Sstefanozampini   PetscCall(MatHYPRE_DestroyCOOMat(A));
16389566063dSJacob Faibussowitsch   PetscCall(MatGetBlockSize(A, &bs));
163906a29025Sstefano_zampini   if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10 * bs;
164006a29025Sstefano_zampini   if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10 * bs;
164106a29025Sstefano_zampini 
1642d975228cSstefano_zampini   if (!dnnz) {
16439566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &hdnnz));
1644*f2f41e48SZach Atkins     for (i = 0; i < A->rmap->n; i++) hdnnz[i] = (HYPRE_Int)dnz;
1645d975228cSstefano_zampini   } else {
16467d968826Sstefano_zampini     hdnnz = (HYPRE_Int *)dnnz;
1647d975228cSstefano_zampini   }
16489566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size));
1649d975228cSstefano_zampini   if (size > 1) {
1650ddbeb582SStefano Zampini     hypre_AuxParCSRMatrix *aux_matrix;
1651d975228cSstefano_zampini     if (!onnz) {
16529566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(A->rmap->n, &honnz));
1653*f2f41e48SZach Atkins       for (i = 0; i < A->rmap->n; i++) honnz[i] = (HYPRE_Int)onz;
165422235d61SPierre Jolivet     } else honnz = (HYPRE_Int *)onnz;
1655ddbeb582SStefano Zampini     /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems
1656ddbeb582SStefano Zampini        they assume the user will input the entire row values, properly sorted
1657336664bdSPierre Jolivet        In PETSc, we don't make such an assumption and set this flag to 1,
1658336664bdSPierre Jolivet        unless the option MAT_SORTED_FULL is set to true.
1659ddbeb582SStefano Zampini        Also, to avoid possible memory leaks, we destroy and recreate the translator
1660ddbeb582SStefano Zampini        This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize
1661ddbeb582SStefano Zampini        the IJ matrix for us */
1662ddbeb582SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1663ddbeb582SStefano Zampini     hypre_AuxParCSRMatrixDestroy(aux_matrix);
1664ddbeb582SStefano Zampini     hypre_IJMatrixTranslator(hA->ij) = NULL;
1665a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(hA->ij, hdnnz, honnz));
1666ddbeb582SStefano Zampini     aux_matrix                               = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1667651b1cf9SStefano Zampini     hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !A->sortedfull;
1668d975228cSstefano_zampini   } else {
1669d975228cSstefano_zampini     honnz = NULL;
1670a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixSetRowSizes(hA->ij, hdnnz));
1671d975228cSstefano_zampini   }
1672ddbeb582SStefano Zampini 
1673af1cf968SStefano Zampini   /* reset assembled flag and call the initialize method */
1674af1cf968SStefano Zampini   hypre_IJMatrixAssembleFlag(hA->ij) = 0;
16756ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
1676a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij));
16776ea7df73SStefano Zampini #else
1678a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixInitialize_v2(hA->ij, HYPRE_MEMORY_HOST));
16796ea7df73SStefano Zampini #endif
168048a46eb9SPierre Jolivet   if (!dnnz) PetscCall(PetscFree(hdnnz));
168148a46eb9SPierre Jolivet   if (!onnz && honnz) PetscCall(PetscFree(honnz));
1682af1cf968SStefano Zampini   /* Match AIJ logic */
168306a29025Sstefano_zampini   A->preallocated = PETSC_TRUE;
1684af1cf968SStefano Zampini   A->assembled    = PETSC_FALSE;
16853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1686d975228cSstefano_zampini }
1687d975228cSstefano_zampini 
1688d975228cSstefano_zampini /*@C
1689d975228cSstefano_zampini   MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format
1690d975228cSstefano_zampini 
1691c3339decSBarry Smith   Collective
1692d975228cSstefano_zampini 
1693d975228cSstefano_zampini   Input Parameters:
1694d975228cSstefano_zampini + A    - the matrix
1695d975228cSstefano_zampini . dnz  - number of nonzeros per row in DIAGONAL portion of local submatrix
1696d975228cSstefano_zampini           (same value is used for all local rows)
1697d975228cSstefano_zampini . dnnz - array containing the number of nonzeros in the various rows of the
1698d975228cSstefano_zampini           DIAGONAL portion of the local submatrix (possibly different for each row)
16992ef1f0ffSBarry Smith           or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `d_nz` is used to specify the nonzero structure.
17002ef1f0ffSBarry Smith           The size of this array is equal to the number of local rows, i.e `m`.
1701d975228cSstefano_zampini           For matrices that will be factored, you must leave room for (and set)
1702d975228cSstefano_zampini           the diagonal entry even if it is zero.
1703d975228cSstefano_zampini . onz  - number of nonzeros per row in the OFF-DIAGONAL portion of local
1704d975228cSstefano_zampini           submatrix (same value is used for all local rows).
1705d975228cSstefano_zampini - onnz - array containing the number of nonzeros in the various rows of the
1706d975228cSstefano_zampini           OFF-DIAGONAL portion of the local submatrix (possibly different for
17072ef1f0ffSBarry Smith           each row) or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `o_nz` is used to specify the nonzero
1708d975228cSstefano_zampini           structure. The size of this array is equal to the number
17092ef1f0ffSBarry Smith           of local rows, i.e `m`.
1710d975228cSstefano_zampini 
17112fe279fdSBarry Smith   Level: intermediate
17122fe279fdSBarry Smith 
171311a5261eSBarry Smith   Note:
17142ef1f0ffSBarry Smith   If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, `onz` and `onnz` are ignored.
1715d975228cSstefano_zampini 
17161cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatMPIAIJSetPreallocation()`, `MATHYPRE`, `MATAIJ`
1717d975228cSstefano_zampini @*/
1718d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[])
1719d71ae5a4SJacob Faibussowitsch {
1720d975228cSstefano_zampini   PetscFunctionBegin;
1721d975228cSstefano_zampini   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
1722d975228cSstefano_zampini   PetscValidType(A, 1);
1723cac4c232SBarry Smith   PetscTryMethod(A, "MatHYPRESetPreallocation_C", (Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[]), (A, dnz, dnnz, onz, onnz));
17243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1725d975228cSstefano_zampini }
1726d975228cSstefano_zampini 
172720f4b53cSBarry Smith /*@C
17282ef1f0ffSBarry Smith   MatCreateFromParCSR - Creates a `Mat` from a `hypre_ParCSRMatrix`
1729225daaf8SStefano Zampini 
1730225daaf8SStefano Zampini   Collective
1731225daaf8SStefano Zampini 
1732225daaf8SStefano Zampini   Input Parameters:
17332ef1f0ffSBarry Smith + parcsr   - the pointer to the `hypre_ParCSRMatrix`
17342ef1f0ffSBarry Smith . mtype    - matrix type to be created. Currently `MATAIJ`, `MATIS` and `MATHYPRE` are supported.
173520f4b53cSBarry Smith - copymode - PETSc copying options, see  `PetscCopyMode`
1736225daaf8SStefano Zampini 
1737225daaf8SStefano Zampini   Output Parameter:
1738225daaf8SStefano Zampini . A - the matrix
1739225daaf8SStefano Zampini 
1740225daaf8SStefano Zampini   Level: intermediate
1741225daaf8SStefano Zampini 
1742bfe80ac4SPierre Jolivet .seealso: [](ch_matrices), `Mat`, `MATHYPRE`, `PetscCopyMode`
174320f4b53cSBarry Smith @*/
1744d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat *A)
1745d71ae5a4SJacob Faibussowitsch {
1746225daaf8SStefano Zampini   Mat        T;
1747978814f1SStefano Zampini   Mat_HYPRE *hA;
1748978814f1SStefano Zampini   MPI_Comm   comm;
1749978814f1SStefano Zampini   PetscInt   rstart, rend, cstart, cend, M, N;
1750d248a85cSRichard Tran Mills   PetscBool  isseqaij, isseqaijmkl, ismpiaij, isaij, ishyp, isis;
1751978814f1SStefano Zampini 
1752978814f1SStefano Zampini   PetscFunctionBegin;
1753978814f1SStefano Zampini   comm = hypre_ParCSRMatrixComm(parcsr);
17549566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATSEQAIJ, &isseqaij));
17559566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATSEQAIJMKL, &isseqaijmkl));
17569566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATMPIAIJ, &ismpiaij));
17579566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij));
17589566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATHYPRE, &ishyp));
17599566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATIS, &isis));
1760d248a85cSRichard Tran Mills   isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij);
17616ea7df73SStefano Zampini   /* TODO */
1762aed4548fSBarry Smith   PetscCheck(isaij || ishyp || isis, comm, PETSC_ERR_SUP, "Unsupported MatType %s! Supported types are %s, %s, %s, %s, %s, and %s", mtype, MATAIJ, MATSEQAIJ, MATSEQAIJMKL, MATMPIAIJ, MATIS, MATHYPRE);
1763978814f1SStefano Zampini   /* access ParCSRMatrix */
1764978814f1SStefano Zampini   rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr);
1765978814f1SStefano Zampini   rend   = hypre_ParCSRMatrixLastRowIndex(parcsr);
1766978814f1SStefano Zampini   cstart = hypre_ParCSRMatrixFirstColDiag(parcsr);
1767978814f1SStefano Zampini   cend   = hypre_ParCSRMatrixLastColDiag(parcsr);
1768978814f1SStefano Zampini   M      = hypre_ParCSRMatrixGlobalNumRows(parcsr);
1769978814f1SStefano Zampini   N      = hypre_ParCSRMatrixGlobalNumCols(parcsr);
1770978814f1SStefano Zampini 
1771978814f1SStefano Zampini   /* create PETSc matrix with MatHYPRE */
17729566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, &T));
1773c2886e86SStefano Zampini   PetscCall(MatSetSizes(T, PetscMax(rend - rstart + 1, 0), PetscMax(cend - cstart + 1, 0), M, N));
17749566063dSJacob Faibussowitsch   PetscCall(MatSetType(T, MATHYPRE));
1775f4f49eeaSPierre Jolivet   hA = (Mat_HYPRE *)T->data;
1776978814f1SStefano Zampini 
1777978814f1SStefano Zampini   /* create HYPRE_IJMatrix */
1778a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rstart, rend, cstart, cend, &hA->ij));
1779a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR));
178045b8d346SStefano Zampini 
178145b8d346SStefano Zampini   /* create new ParCSR object if needed */
178245b8d346SStefano Zampini   if (ishyp && copymode == PETSC_COPY_VALUES) {
178345b8d346SStefano Zampini     hypre_ParCSRMatrix *new_parcsr;
17846ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
178545b8d346SStefano Zampini     hypre_CSRMatrix *hdiag, *hoffd, *ndiag, *noffd;
178645b8d346SStefano Zampini 
17870e6427aaSSatish Balay     new_parcsr = hypre_ParCSRMatrixClone(parcsr, 0);
178845b8d346SStefano Zampini     hdiag      = hypre_ParCSRMatrixDiag(parcsr);
178945b8d346SStefano Zampini     hoffd      = hypre_ParCSRMatrixOffd(parcsr);
179045b8d346SStefano Zampini     ndiag      = hypre_ParCSRMatrixDiag(new_parcsr);
179145b8d346SStefano Zampini     noffd      = hypre_ParCSRMatrixOffd(new_parcsr);
17929566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hypre_CSRMatrixData(ndiag), hypre_CSRMatrixData(hdiag), hypre_CSRMatrixNumNonzeros(hdiag)));
17939566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hypre_CSRMatrixData(noffd), hypre_CSRMatrixData(hoffd), hypre_CSRMatrixNumNonzeros(hoffd)));
17946ea7df73SStefano Zampini #else
17956ea7df73SStefano Zampini     new_parcsr = hypre_ParCSRMatrixClone(parcsr, 1);
17966ea7df73SStefano Zampini #endif
179745b8d346SStefano Zampini     parcsr   = new_parcsr;
179845b8d346SStefano Zampini     copymode = PETSC_OWN_POINTER;
179945b8d346SStefano Zampini   }
1800978814f1SStefano Zampini 
1801978814f1SStefano Zampini   /* set ParCSR object */
1802978814f1SStefano Zampini   hypre_IJMatrixObject(hA->ij) = parcsr;
18034ec6421dSstefano_zampini   T->preallocated              = PETSC_TRUE;
1804978814f1SStefano Zampini 
1805978814f1SStefano Zampini   /* set assembled flag */
1806978814f1SStefano Zampini   hypre_IJMatrixAssembleFlag(hA->ij) = 1;
18076ea7df73SStefano Zampini #if 0
1808a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij));
18096ea7df73SStefano Zampini #endif
1810225daaf8SStefano Zampini   if (ishyp) {
18116d2a658fSstefano_zampini     PetscMPIInt myid = 0;
18126d2a658fSstefano_zampini 
18136d2a658fSstefano_zampini     /* make sure we always have row_starts and col_starts available */
181448a46eb9SPierre Jolivet     if (HYPRE_AssumedPartitionCheck()) PetscCallMPI(MPI_Comm_rank(comm, &myid));
1815a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
18166d2a658fSstefano_zampini     if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) {
18176d2a658fSstefano_zampini       PetscLayout map;
18186d2a658fSstefano_zampini 
18199566063dSJacob Faibussowitsch       PetscCall(MatGetLayouts(T, NULL, &map));
18209566063dSJacob Faibussowitsch       PetscCall(PetscLayoutSetUp(map));
18212cf14000SStefano Zampini       hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid);
18226d2a658fSstefano_zampini     }
18236d2a658fSstefano_zampini     if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) {
18246d2a658fSstefano_zampini       PetscLayout map;
18256d2a658fSstefano_zampini 
18269566063dSJacob Faibussowitsch       PetscCall(MatGetLayouts(T, &map, NULL));
18279566063dSJacob Faibussowitsch       PetscCall(PetscLayoutSetUp(map));
18282cf14000SStefano Zampini       hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid);
18296d2a658fSstefano_zampini     }
1830a1d2239cSSatish Balay #endif
1831978814f1SStefano Zampini     /* prevent from freeing the pointer */
1832978814f1SStefano Zampini     if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE;
1833225daaf8SStefano Zampini     *A = T;
18349566063dSJacob Faibussowitsch     PetscCall(MatSetOption(*A, MAT_SORTED_FULL, PETSC_TRUE));
18359566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(*A, MAT_FINAL_ASSEMBLY));
18369566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(*A, MAT_FINAL_ASSEMBLY));
1837bb4689ddSStefano Zampini   } else if (isaij) {
1838bb4689ddSStefano Zampini     if (copymode != PETSC_OWN_POINTER) {
1839225daaf8SStefano Zampini       /* prevent from freeing the pointer */
1840225daaf8SStefano Zampini       hA->inner_free = PETSC_FALSE;
18419566063dSJacob Faibussowitsch       PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INITIAL_MATRIX, A));
18429566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&T));
1843225daaf8SStefano Zampini     } else { /* AIJ return type with PETSC_OWN_POINTER */
18449566063dSJacob Faibussowitsch       PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INPLACE_MATRIX, &T));
1845225daaf8SStefano Zampini       *A = T;
1846225daaf8SStefano Zampini     }
1847bb4689ddSStefano Zampini   } else if (isis) {
18489566063dSJacob Faibussowitsch     PetscCall(MatConvert_HYPRE_IS(T, MATIS, MAT_INITIAL_MATRIX, A));
18498cfe8d00SStefano Zampini     if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE;
18509566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&T));
1851bb4689ddSStefano Zampini   }
18523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1853978814f1SStefano Zampini }
1854978814f1SStefano Zampini 
1855d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr)
1856d71ae5a4SJacob Faibussowitsch {
1857dd9c0a25Sstefano_zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1858dd9c0a25Sstefano_zampini   HYPRE_Int  type;
1859dd9c0a25Sstefano_zampini 
1860dd9c0a25Sstefano_zampini   PetscFunctionBegin;
186128b400f6SJacob Faibussowitsch   PetscCheck(hA->ij, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE_IJMatrix not present");
1862a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type));
186308401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "HYPRE_IJMatrix is not of type HYPRE_PARCSR");
1864a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)parcsr));
18653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1866dd9c0a25Sstefano_zampini }
1867dd9c0a25Sstefano_zampini 
186820f4b53cSBarry Smith /*@C
1869dd9c0a25Sstefano_zampini   MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix
1870dd9c0a25Sstefano_zampini 
1871cc4c1da9SBarry Smith   Not Collective, No Fortran Support
1872dd9c0a25Sstefano_zampini 
187320f4b53cSBarry Smith   Input Parameter:
187420f4b53cSBarry Smith . A - the `MATHYPRE` object
1875dd9c0a25Sstefano_zampini 
1876dd9c0a25Sstefano_zampini   Output Parameter:
18772ef1f0ffSBarry Smith . parcsr - the pointer to the `hypre_ParCSRMatrix`
1878dd9c0a25Sstefano_zampini 
1879dd9c0a25Sstefano_zampini   Level: intermediate
1880dd9c0a25Sstefano_zampini 
1881bfe80ac4SPierre Jolivet .seealso: [](ch_matrices), `Mat`, `MATHYPRE`, `PetscCopyMode`
188220f4b53cSBarry Smith @*/
1883d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr)
1884d71ae5a4SJacob Faibussowitsch {
1885dd9c0a25Sstefano_zampini   PetscFunctionBegin;
1886dd9c0a25Sstefano_zampini   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
1887dd9c0a25Sstefano_zampini   PetscValidType(A, 1);
1888cac4c232SBarry Smith   PetscUseMethod(A, "MatHYPREGetParCSR_C", (Mat, hypre_ParCSRMatrix **), (A, parcsr));
18893ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1890dd9c0a25Sstefano_zampini }
1891dd9c0a25Sstefano_zampini 
1892d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_HYPRE(Mat A, PetscBool *missing, PetscInt *dd)
1893d71ae5a4SJacob Faibussowitsch {
189468ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
189568ec7858SStefano Zampini   hypre_CSRMatrix    *ha;
189668ec7858SStefano Zampini   PetscInt            rst;
189768ec7858SStefano Zampini 
189868ec7858SStefano Zampini   PetscFunctionBegin;
189908401ef6SPierre Jolivet   PetscCheck(A->rmap->n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_SUP, "Not implemented with non-square diagonal blocks");
19009566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A, &rst, NULL));
19019566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
190268ec7858SStefano Zampini   if (missing) *missing = PETSC_FALSE;
190368ec7858SStefano Zampini   if (dd) *dd = -1;
190468ec7858SStefano Zampini   ha = hypre_ParCSRMatrixDiag(parcsr);
190568ec7858SStefano Zampini   if (ha) {
190668299464SStefano Zampini     PetscInt   size, i;
190768299464SStefano Zampini     HYPRE_Int *ii, *jj;
190868ec7858SStefano Zampini 
190968ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
191068ec7858SStefano Zampini     ii   = hypre_CSRMatrixI(ha);
191168ec7858SStefano Zampini     jj   = hypre_CSRMatrixJ(ha);
191268ec7858SStefano Zampini     for (i = 0; i < size; i++) {
191368ec7858SStefano Zampini       PetscInt  j;
191468ec7858SStefano Zampini       PetscBool found = PETSC_FALSE;
191568ec7858SStefano Zampini 
19169371c9d4SSatish Balay       for (j = ii[i]; j < ii[i + 1] && !found; j++) found = (jj[j] == i) ? PETSC_TRUE : PETSC_FALSE;
191768ec7858SStefano Zampini 
191868ec7858SStefano Zampini       if (!found) {
19193ba16761SJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing local diagonal entry %" PetscInt_FMT "\n", i));
192068ec7858SStefano Zampini         if (missing) *missing = PETSC_TRUE;
192168ec7858SStefano Zampini         if (dd) *dd = i + rst;
19223ba16761SJacob Faibussowitsch         PetscFunctionReturn(PETSC_SUCCESS);
192368ec7858SStefano Zampini       }
192468ec7858SStefano Zampini     }
192568ec7858SStefano Zampini     if (!size) {
19263ba16761SJacob Faibussowitsch       PetscCall(PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n"));
192768ec7858SStefano Zampini       if (missing) *missing = PETSC_TRUE;
192868ec7858SStefano Zampini       if (dd) *dd = rst;
192968ec7858SStefano Zampini     }
193068ec7858SStefano Zampini   } else {
19313ba16761SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n"));
193268ec7858SStefano Zampini     if (missing) *missing = PETSC_TRUE;
193368ec7858SStefano Zampini     if (dd) *dd = rst;
193468ec7858SStefano Zampini   }
19353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
193668ec7858SStefano Zampini }
193768ec7858SStefano Zampini 
1938d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s)
1939d71ae5a4SJacob Faibussowitsch {
194068ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
19416ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
194268ec7858SStefano Zampini   hypre_CSRMatrix *ha;
19436ea7df73SStefano Zampini #endif
194439accc25SStefano Zampini   HYPRE_Complex hs;
194568ec7858SStefano Zampini 
194668ec7858SStefano Zampini   PetscFunctionBegin;
19479566063dSJacob Faibussowitsch   PetscCall(PetscHYPREScalarCast(s, &hs));
19489566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
19496ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 19, 0)
1950a333fa2bSZach Atkins   PetscCallHYPRE(hypre_ParCSRMatrixScale(parcsr, hs));
19516ea7df73SStefano Zampini #else /* diagonal part */
195268ec7858SStefano Zampini   ha = hypre_ParCSRMatrixDiag(parcsr);
195368ec7858SStefano Zampini   if (ha) {
195468299464SStefano Zampini     PetscInt       size, i;
195568299464SStefano Zampini     HYPRE_Int     *ii;
195639accc25SStefano Zampini     HYPRE_Complex *a;
195768ec7858SStefano Zampini 
195868ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
195968ec7858SStefano Zampini     a    = hypre_CSRMatrixData(ha);
196068ec7858SStefano Zampini     ii   = hypre_CSRMatrixI(ha);
196139accc25SStefano Zampini     for (i = 0; i < ii[size]; i++) a[i] *= hs;
196268ec7858SStefano Zampini   }
19634cf0e950SBarry Smith   /* off-diagonal part */
196468ec7858SStefano Zampini   ha = hypre_ParCSRMatrixOffd(parcsr);
196568ec7858SStefano Zampini   if (ha) {
196668299464SStefano Zampini     PetscInt       size, i;
196768299464SStefano Zampini     HYPRE_Int     *ii;
196839accc25SStefano Zampini     HYPRE_Complex *a;
196968ec7858SStefano Zampini 
197068ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
197168ec7858SStefano Zampini     a    = hypre_CSRMatrixData(ha);
197268ec7858SStefano Zampini     ii   = hypre_CSRMatrixI(ha);
197339accc25SStefano Zampini     for (i = 0; i < ii[size]; i++) a[i] *= hs;
197468ec7858SStefano Zampini   }
19756ea7df73SStefano Zampini #endif
19763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
197768ec7858SStefano Zampini }
197868ec7858SStefano Zampini 
1979d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
1980d71ae5a4SJacob Faibussowitsch {
198168ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
198268299464SStefano Zampini   HYPRE_Int          *lrows;
198368299464SStefano Zampini   PetscInt            rst, ren, i;
198468ec7858SStefano Zampini 
198568ec7858SStefano Zampini   PetscFunctionBegin;
198608401ef6SPierre Jolivet   PetscCheck(!x && !b, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "To be implemented");
19879566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
19889566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(numRows, &lrows));
19899566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A, &rst, &ren));
199068ec7858SStefano Zampini   for (i = 0; i < numRows; i++) {
19917a46b595SBarry Smith     PetscCheck(rows[i] >= rst && rows[i] < ren, PETSC_COMM_SELF, PETSC_ERR_SUP, "Non-local rows not yet supported");
1992*f2f41e48SZach Atkins     lrows[i] = (HYPRE_Int)(rows[i] - rst);
199368ec7858SStefano Zampini   }
1994*f2f41e48SZach Atkins   PetscCallHYPRE(hypre_ParCSRMatrixEliminateRowsCols(parcsr, (HYPRE_Int)numRows, lrows));
19959566063dSJacob Faibussowitsch   PetscCall(PetscFree(lrows));
19963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
199768ec7858SStefano Zampini }
199868ec7858SStefano Zampini 
1999d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha)
2000d71ae5a4SJacob Faibussowitsch {
2001c69f721fSFande Kong   PetscFunctionBegin;
2002c69f721fSFande Kong   if (ha) {
2003c69f721fSFande Kong     HYPRE_Int     *ii, size;
2004c69f721fSFande Kong     HYPRE_Complex *a;
2005c69f721fSFande Kong 
2006c69f721fSFande Kong     size = hypre_CSRMatrixNumRows(ha);
2007c69f721fSFande Kong     a    = hypre_CSRMatrixData(ha);
2008c69f721fSFande Kong     ii   = hypre_CSRMatrixI(ha);
2009c69f721fSFande Kong 
20109566063dSJacob Faibussowitsch     if (a) PetscCall(PetscArrayzero(a, ii[size]));
2011c69f721fSFande Kong   }
20123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2013c69f721fSFande Kong }
2014c69f721fSFande Kong 
201566976f2fSJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE(Mat A)
2016d71ae5a4SJacob Faibussowitsch {
20176ea7df73SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
20186ea7df73SStefano Zampini 
20196ea7df73SStefano Zampini   PetscFunctionBegin;
20206ea7df73SStefano Zampini   if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) {
2021a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixSetConstantValues(hA->ij, 0.0));
20226ea7df73SStefano Zampini   } else {
2023c69f721fSFande Kong     hypre_ParCSRMatrix *parcsr;
2024c69f721fSFande Kong 
20259566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
20269566063dSJacob Faibussowitsch     PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr)));
20279566063dSJacob Faibussowitsch     PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr)));
20286ea7df73SStefano Zampini   }
20293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2030c69f721fSFande Kong }
2031c69f721fSFande Kong 
2032d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA, PetscInt N, const PetscInt rows[], HYPRE_Complex diag)
2033d71ae5a4SJacob Faibussowitsch {
203439accc25SStefano Zampini   PetscInt       ii;
203539accc25SStefano Zampini   HYPRE_Int     *i, *j;
203639accc25SStefano Zampini   HYPRE_Complex *a;
2037c69f721fSFande Kong 
2038c69f721fSFande Kong   PetscFunctionBegin;
20393ba16761SJacob Faibussowitsch   if (!hA) PetscFunctionReturn(PETSC_SUCCESS);
2040c69f721fSFande Kong 
204139accc25SStefano Zampini   i = hypre_CSRMatrixI(hA);
204239accc25SStefano Zampini   j = hypre_CSRMatrixJ(hA);
2043c69f721fSFande Kong   a = hypre_CSRMatrixData(hA);
2044a32e9c99SJunchao Zhang #if defined(PETSC_HAVE_HYPRE_DEVICE)
2045a32e9c99SJunchao Zhang   if (HYPRE_MEMORY_DEVICE == hypre_CSRMatrixMemoryLocation(hA)) {
2046a32e9c99SJunchao Zhang   #if defined(HYPRE_USING_CUDA)
2047a32e9c99SJunchao Zhang     MatZeroRows_CUDA(N, rows, i, j, a, diag);
2048a32e9c99SJunchao Zhang   #elif defined(HYPRE_USING_HIP)
2049a32e9c99SJunchao Zhang     MatZeroRows_HIP(N, rows, i, j, a, diag);
2050a32e9c99SJunchao Zhang   #elif defined(PETSC_HAVE_KOKKOS)
2051a32e9c99SJunchao Zhang     MatZeroRows_Kokkos(N, rows, i, j, a, diag);
2052a32e9c99SJunchao Zhang   #else
2053a32e9c99SJunchao Zhang     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for MatZeroRows on a hypre matrix in this memory location");
2054a32e9c99SJunchao Zhang   #endif
2055a32e9c99SJunchao Zhang   } else
2056a32e9c99SJunchao Zhang #endif
2057a32e9c99SJunchao Zhang   {
2058c69f721fSFande Kong     for (ii = 0; ii < N; ii++) {
205939accc25SStefano Zampini       HYPRE_Int jj, ibeg, iend, irow;
206039accc25SStefano Zampini 
2061*f2f41e48SZach Atkins       irow = (HYPRE_Int)rows[ii];
2062c69f721fSFande Kong       ibeg = i[irow];
2063c69f721fSFande Kong       iend = i[irow + 1];
2064c69f721fSFande Kong       for (jj = ibeg; jj < iend; jj++)
2065c69f721fSFande Kong         if (j[jj] == irow) a[jj] = diag;
2066c69f721fSFande Kong         else a[jj] = 0.0;
2067c69f721fSFande Kong     }
2068a32e9c99SJunchao Zhang   }
20693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2070c69f721fSFande Kong }
2071c69f721fSFande Kong 
2072d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2073d71ae5a4SJacob Faibussowitsch {
2074c69f721fSFande Kong   hypre_ParCSRMatrix *parcsr;
2075a32e9c99SJunchao Zhang   PetscInt           *lrows, len, *lrows2;
207639accc25SStefano Zampini   HYPRE_Complex       hdiag;
2077c69f721fSFande Kong 
2078c69f721fSFande Kong   PetscFunctionBegin;
207908401ef6SPierre Jolivet   PetscCheck(!x && !b, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size");
20809566063dSJacob Faibussowitsch   PetscCall(PetscHYPREScalarCast(diag, &hdiag));
2081c69f721fSFande Kong   /* retrieve the internal matrix */
20829566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
2083c69f721fSFande Kong   /* get locally owned rows */
20849566063dSJacob Faibussowitsch   PetscCall(MatZeroRowsMapLocal_Private(A, N, rows, &len, &lrows));
2085a32e9c99SJunchao Zhang 
2086a32e9c99SJunchao Zhang #if defined(PETSC_HAVE_HYPRE_DEVICE)
2087a32e9c99SJunchao Zhang   if (HYPRE_MEMORY_DEVICE == hypre_CSRMatrixMemoryLocation(hypre_ParCSRMatrixDiag(parcsr))) {
2088a32e9c99SJunchao Zhang     Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
2089a32e9c99SJunchao Zhang     PetscInt   m;
2090a32e9c99SJunchao Zhang     PetscCall(MatGetLocalSize(A, &m, NULL));
2091a32e9c99SJunchao Zhang     if (!hA->rows_d) {
2092a32e9c99SJunchao Zhang       hA->rows_d = hypre_TAlloc(PetscInt, m, HYPRE_MEMORY_DEVICE);
2093a32e9c99SJunchao Zhang       if (m) PetscCheck(hA->rows_d, PETSC_COMM_SELF, PETSC_ERR_MEM, "HYPRE_TAlloc failed");
2094a32e9c99SJunchao Zhang     }
2095a32e9c99SJunchao Zhang     PetscCheck(len <= m, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Too many rows in rows[]");
2096a32e9c99SJunchao Zhang     PetscStackCallExternalVoid("hypre_Memcpy", hypre_Memcpy(hA->rows_d, lrows, sizeof(PetscInt) * len, HYPRE_MEMORY_DEVICE, HYPRE_MEMORY_HOST));
2097a32e9c99SJunchao Zhang     lrows2 = hA->rows_d;
2098a32e9c99SJunchao Zhang   } else
2099a32e9c99SJunchao Zhang #endif
2100a32e9c99SJunchao Zhang   {
2101a32e9c99SJunchao Zhang     lrows2 = lrows;
2102a32e9c99SJunchao Zhang   }
2103a32e9c99SJunchao Zhang 
2104c69f721fSFande Kong   /* zero diagonal part */
2105a32e9c99SJunchao Zhang   PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr), len, lrows2, hdiag));
2106c69f721fSFande Kong   /* zero off-diagonal part */
2107a32e9c99SJunchao Zhang   PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr), len, lrows2, 0.0));
2108c69f721fSFande Kong 
21099566063dSJacob Faibussowitsch   PetscCall(PetscFree(lrows));
21103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2111c69f721fSFande Kong }
2112c69f721fSFande Kong 
2113d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat, MatAssemblyType mode)
2114d71ae5a4SJacob Faibussowitsch {
2115c69f721fSFande Kong   PetscFunctionBegin;
21163ba16761SJacob Faibussowitsch   if (mat->nooffprocentries) PetscFunctionReturn(PETSC_SUCCESS);
2117c69f721fSFande Kong 
21189566063dSJacob Faibussowitsch   PetscCall(MatStashScatterBegin_Private(mat, &mat->stash, mat->rmap->range));
21193ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2120c69f721fSFande Kong }
2121c69f721fSFande Kong 
2122d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2123d71ae5a4SJacob Faibussowitsch {
2124c69f721fSFande Kong   hypre_ParCSRMatrix *parcsr;
21252cf14000SStefano Zampini   HYPRE_Int           hnz;
2126c69f721fSFande Kong 
2127c69f721fSFande Kong   PetscFunctionBegin;
2128c69f721fSFande Kong   /* retrieve the internal matrix */
21299566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
2130c69f721fSFande Kong   /* call HYPRE API */
2131a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_ParCSRMatrixGetRow(parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v));
21322cf14000SStefano Zampini   if (nz) *nz = (PetscInt)hnz;
21333ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2134c69f721fSFande Kong }
2135c69f721fSFande Kong 
2136d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2137d71ae5a4SJacob Faibussowitsch {
2138c69f721fSFande Kong   hypre_ParCSRMatrix *parcsr;
21392cf14000SStefano Zampini   HYPRE_Int           hnz;
2140c69f721fSFande Kong 
2141c69f721fSFande Kong   PetscFunctionBegin;
2142c69f721fSFande Kong   /* retrieve the internal matrix */
21439566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
2144c69f721fSFande Kong   /* call HYPRE API */
21452cf14000SStefano Zampini   hnz = nz ? (HYPRE_Int)(*nz) : 0;
2146a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_ParCSRMatrixRestoreRow(parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v));
21473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2148c69f721fSFande Kong }
2149c69f721fSFande Kong 
2150d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetValues_HYPRE(Mat A, PetscInt m, const PetscInt idxm[], PetscInt n, const PetscInt idxn[], PetscScalar v[])
2151d71ae5a4SJacob Faibussowitsch {
215245b8d346SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
2153c69f721fSFande Kong   PetscInt   i;
21541d4906efSStefano Zampini 
2155c69f721fSFande Kong   PetscFunctionBegin;
21563ba16761SJacob Faibussowitsch   if (!m || !n) PetscFunctionReturn(PETSC_SUCCESS);
2157c69f721fSFande Kong   /* Ignore negative row indices
2158c69f721fSFande Kong    * And negative column indices should be automatically ignored in hypre
2159c69f721fSFande Kong    * */
21602cf14000SStefano Zampini   for (i = 0; i < m; i++) {
21612cf14000SStefano Zampini     if (idxm[i] >= 0) {
21622cf14000SStefano Zampini       HYPRE_Int hn = (HYPRE_Int)n;
2163a333fa2bSZach Atkins       PetscCallHYPRE(HYPRE_IJMatrixGetValues(hA->ij, 1, &hn, (HYPRE_BigInt *)&idxm[i], (HYPRE_BigInt *)idxn, (HYPRE_Complex *)(v + i * n)));
21642cf14000SStefano Zampini     }
21652cf14000SStefano Zampini   }
21663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2167c69f721fSFande Kong }
2168c69f721fSFande Kong 
2169d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetOption_HYPRE(Mat A, MatOption op, PetscBool flg)
2170d71ae5a4SJacob Faibussowitsch {
2171ddbeb582SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
2172ddbeb582SStefano Zampini 
2173ddbeb582SStefano Zampini   PetscFunctionBegin;
2174c6698e78SStefano Zampini   switch (op) {
2175ddbeb582SStefano Zampini   case MAT_NO_OFF_PROC_ENTRIES:
2176a333fa2bSZach Atkins     if (flg) PetscCallHYPRE(HYPRE_IJMatrixSetMaxOffProcElmts(hA->ij, 0));
2177ddbeb582SStefano Zampini     break;
2178651b1cf9SStefano Zampini   case MAT_IGNORE_OFF_PROC_ENTRIES:
2179651b1cf9SStefano Zampini     hA->donotstash = flg;
2180d71ae5a4SJacob Faibussowitsch     break;
2181d71ae5a4SJacob Faibussowitsch   default:
2182d71ae5a4SJacob Faibussowitsch     break;
2183ddbeb582SStefano Zampini   }
21843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2185ddbeb582SStefano Zampini }
2186c69f721fSFande Kong 
2187d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view)
2188d71ae5a4SJacob Faibussowitsch {
218945b8d346SStefano Zampini   PetscViewerFormat format;
219045b8d346SStefano Zampini 
219145b8d346SStefano Zampini   PetscFunctionBegin;
21929566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(view, &format));
21933ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
219445b8d346SStefano Zampini   if (format != PETSC_VIEWER_NATIVE) {
21956ea7df73SStefano Zampini     Mat                 B;
21966ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
21976ea7df73SStefano Zampini     PetscErrorCode (*mview)(Mat, PetscViewer) = NULL;
21986ea7df73SStefano Zampini 
21999566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
22009566063dSJacob Faibussowitsch     PetscCall(MatCreateFromParCSR(parcsr, MATAIJ, PETSC_USE_POINTER, &B));
220157d50842SBarry Smith     PetscCall(MatGetOperation(B, MATOP_VIEW, (PetscErrorCodeFn **)&mview));
220228b400f6SJacob Faibussowitsch     PetscCheck(mview, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Missing view operation");
22039566063dSJacob Faibussowitsch     PetscCall((*mview)(B, view));
22049566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&B));
220545b8d346SStefano Zampini   } else {
220645b8d346SStefano Zampini     Mat_HYPRE  *hA = (Mat_HYPRE *)A->data;
220745b8d346SStefano Zampini     PetscMPIInt size;
220845b8d346SStefano Zampini     PetscBool   isascii;
220945b8d346SStefano Zampini     const char *filename;
221045b8d346SStefano Zampini 
221145b8d346SStefano Zampini     /* HYPRE uses only text files */
22129566063dSJacob Faibussowitsch     PetscCall(PetscObjectTypeCompare((PetscObject)view, PETSCVIEWERASCII, &isascii));
221328b400f6SJacob Faibussowitsch     PetscCheck(isascii, PetscObjectComm((PetscObject)view), PETSC_ERR_SUP, "PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII", ((PetscObject)view)->type_name);
22149566063dSJacob Faibussowitsch     PetscCall(PetscViewerFileGetName(view, &filename));
2215a333fa2bSZach Atkins     PetscCallHYPRE(HYPRE_IJMatrixPrint(hA->ij, filename));
22169566063dSJacob Faibussowitsch     PetscCallMPI(MPI_Comm_size(hA->comm, &size));
221745b8d346SStefano Zampini     if (size > 1) {
22189566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(view, "Matrix files: %s.%05d ... %s.%05d\n", filename, 0, filename, size - 1));
221945b8d346SStefano Zampini     } else {
22209566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(view, "Matrix file: %s.%05d\n", filename, 0));
222145b8d346SStefano Zampini     }
222245b8d346SStefano Zampini   }
22233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
222445b8d346SStefano Zampini }
222545b8d346SStefano Zampini 
2226d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str)
2227d71ae5a4SJacob Faibussowitsch {
2228465edc17SStefano Zampini   hypre_ParCSRMatrix *acsr, *bcsr;
2229465edc17SStefano Zampini 
2230465edc17SStefano Zampini   PetscFunctionBegin;
2231465edc17SStefano Zampini   if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) {
22329566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A, &acsr));
22339566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(B, &bcsr));
2234a333fa2bSZach Atkins     PetscCallHYPRE(hypre_ParCSRMatrixCopy(acsr, bcsr, 1));
22359566063dSJacob Faibussowitsch     PetscCall(MatSetOption(B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */
22369566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
22379566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
2238465edc17SStefano Zampini   } else {
22399566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2240465edc17SStefano Zampini   }
22413ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2242465edc17SStefano Zampini }
2243465edc17SStefano Zampini 
2244d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d)
2245d71ae5a4SJacob Faibussowitsch {
22466305df00SStefano Zampini   hypre_ParCSRMatrix *parcsr;
22476305df00SStefano Zampini   hypre_CSRMatrix    *dmat;
224839accc25SStefano Zampini   HYPRE_Complex      *a;
22496305df00SStefano Zampini   PetscBool           cong;
22506305df00SStefano Zampini 
22516305df00SStefano Zampini   PetscFunctionBegin;
22529566063dSJacob Faibussowitsch   PetscCall(MatHasCongruentLayouts(A, &cong));
225328b400f6SJacob Faibussowitsch   PetscCheck(cong, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only for square matrices with same local distributions of rows and columns");
22549566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
22556305df00SStefano Zampini   dmat = hypre_ParCSRMatrixDiag(parcsr);
22566305df00SStefano Zampini   if (dmat) {
225706977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
225806977982Sstefanozampini     HYPRE_MemoryLocation mem = hypre_CSRMatrixMemoryLocation(dmat);
225906977982Sstefanozampini #else
226006977982Sstefanozampini     HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST;
226106977982Sstefanozampini #endif
226206977982Sstefanozampini 
226306977982Sstefanozampini     if (mem != HYPRE_MEMORY_HOST) PetscCall(VecGetArrayWriteAndMemType(d, (PetscScalar **)&a, NULL));
226406977982Sstefanozampini     else PetscCall(VecGetArrayWrite(d, (PetscScalar **)&a));
226506977982Sstefanozampini     hypre_CSRMatrixExtractDiagonal(dmat, a, 0);
226606977982Sstefanozampini     if (mem != HYPRE_MEMORY_HOST) PetscCall(VecRestoreArrayWriteAndMemType(d, (PetscScalar **)&a));
226706977982Sstefanozampini     else PetscCall(VecRestoreArrayWrite(d, (PetscScalar **)&a));
22686305df00SStefano Zampini   }
22693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22706305df00SStefano Zampini }
22716305df00SStefano Zampini 
2272363d496dSStefano Zampini #include <petscblaslapack.h>
2273363d496dSStefano Zampini 
2274d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAXPY_HYPRE(Mat Y, PetscScalar a, Mat X, MatStructure str)
2275d71ae5a4SJacob Faibussowitsch {
2276363d496dSStefano Zampini   PetscFunctionBegin;
22776ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
22786ea7df73SStefano Zampini   {
22796ea7df73SStefano Zampini     Mat                 B;
22806ea7df73SStefano Zampini     hypre_ParCSRMatrix *x, *y, *z;
22816ea7df73SStefano Zampini 
22829566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(Y, &y));
22839566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(X, &x));
2284a333fa2bSZach Atkins     PetscCallHYPRE(hypre_ParCSRMatrixAdd(1.0, y, 1.0, x, &z));
22859566063dSJacob Faibussowitsch     PetscCall(MatCreateFromParCSR(z, MATHYPRE, PETSC_OWN_POINTER, &B));
22869566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
22876ea7df73SStefano Zampini   }
22886ea7df73SStefano Zampini #else
2289363d496dSStefano Zampini   if (str == SAME_NONZERO_PATTERN) {
2290363d496dSStefano Zampini     hypre_ParCSRMatrix *x, *y;
2291363d496dSStefano Zampini     hypre_CSRMatrix    *xloc, *yloc;
2292363d496dSStefano Zampini     PetscInt            xnnz, ynnz;
229339accc25SStefano Zampini     HYPRE_Complex      *xarr, *yarr;
2294363d496dSStefano Zampini     PetscBLASInt        one = 1, bnz;
2295363d496dSStefano Zampini 
22969566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(Y, &y));
22979566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(X, &x));
2298363d496dSStefano Zampini 
2299363d496dSStefano Zampini     /* diagonal block */
2300363d496dSStefano Zampini     xloc = hypre_ParCSRMatrixDiag(x);
2301363d496dSStefano Zampini     yloc = hypre_ParCSRMatrixDiag(y);
2302363d496dSStefano Zampini     xnnz = 0;
2303363d496dSStefano Zampini     ynnz = 0;
2304363d496dSStefano Zampini     xarr = NULL;
2305363d496dSStefano Zampini     yarr = NULL;
2306363d496dSStefano Zampini     if (xloc) {
230739accc25SStefano Zampini       xarr = hypre_CSRMatrixData(xloc);
2308363d496dSStefano Zampini       xnnz = hypre_CSRMatrixNumNonzeros(xloc);
2309363d496dSStefano Zampini     }
2310363d496dSStefano Zampini     if (yloc) {
231139accc25SStefano Zampini       yarr = hypre_CSRMatrixData(yloc);
2312363d496dSStefano Zampini       ynnz = hypre_CSRMatrixNumNonzeros(yloc);
2313363d496dSStefano Zampini     }
231408401ef6SPierre Jolivet     PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz);
23159566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(xnnz, &bnz));
2316792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one));
2317363d496dSStefano Zampini 
2318363d496dSStefano Zampini     /* off-diagonal block */
2319363d496dSStefano Zampini     xloc = hypre_ParCSRMatrixOffd(x);
2320363d496dSStefano Zampini     yloc = hypre_ParCSRMatrixOffd(y);
2321363d496dSStefano Zampini     xnnz = 0;
2322363d496dSStefano Zampini     ynnz = 0;
2323363d496dSStefano Zampini     xarr = NULL;
2324363d496dSStefano Zampini     yarr = NULL;
2325363d496dSStefano Zampini     if (xloc) {
232639accc25SStefano Zampini       xarr = hypre_CSRMatrixData(xloc);
2327363d496dSStefano Zampini       xnnz = hypre_CSRMatrixNumNonzeros(xloc);
2328363d496dSStefano Zampini     }
2329363d496dSStefano Zampini     if (yloc) {
233039accc25SStefano Zampini       yarr = hypre_CSRMatrixData(yloc);
2331363d496dSStefano Zampini       ynnz = hypre_CSRMatrixNumNonzeros(yloc);
2332363d496dSStefano Zampini     }
233308401ef6SPierre Jolivet     PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz);
23349566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(xnnz, &bnz));
2335792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one));
2336363d496dSStefano Zampini   } else if (str == SUBSET_NONZERO_PATTERN) {
23379566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
2338363d496dSStefano Zampini   } else {
2339363d496dSStefano Zampini     Mat B;
2340363d496dSStefano Zampini 
23419566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic_Preallocate(Y, X, &B));
23429566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
23439566063dSJacob Faibussowitsch     PetscCall(MatHeaderReplace(Y, &B));
2344363d496dSStefano Zampini   }
23456ea7df73SStefano Zampini #endif
23463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2347363d496dSStefano Zampini }
2348363d496dSStefano Zampini 
23492c4ab24aSJunchao Zhang static PetscErrorCode MatDuplicate_HYPRE(Mat A, MatDuplicateOption op, Mat *B)
23502c4ab24aSJunchao Zhang {
23512c4ab24aSJunchao Zhang   hypre_ParCSRMatrix *parcsr = NULL;
23522c4ab24aSJunchao Zhang   PetscCopyMode       cpmode;
23532c4ab24aSJunchao Zhang   Mat_HYPRE          *hA;
23542c4ab24aSJunchao Zhang 
23552c4ab24aSJunchao Zhang   PetscFunctionBegin;
23562c4ab24aSJunchao Zhang   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
23572c4ab24aSJunchao Zhang   if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) {
23582c4ab24aSJunchao Zhang     parcsr = hypre_ParCSRMatrixClone(parcsr, 0);
23592c4ab24aSJunchao Zhang     cpmode = PETSC_OWN_POINTER;
23602c4ab24aSJunchao Zhang   } else {
23612c4ab24aSJunchao Zhang     cpmode = PETSC_COPY_VALUES;
23622c4ab24aSJunchao Zhang   }
23632c4ab24aSJunchao Zhang   PetscCall(MatCreateFromParCSR(parcsr, MATHYPRE, cpmode, B));
23642c4ab24aSJunchao Zhang   hA = (Mat_HYPRE *)A->data;
23652c4ab24aSJunchao Zhang   if (hA->cooMat) {
236606977982Sstefanozampini     Mat_HYPRE *hB = (Mat_HYPRE *)((*B)->data);
2367b73e3080SStefano Zampini     op            = (op == MAT_DO_NOT_COPY_VALUES) ? op : MAT_COPY_VALUES;
2368b73e3080SStefano Zampini     /* Cannot simply increase the reference count of hA->cooMat, since B needs to share cooMat's data array */
236906977982Sstefanozampini     PetscCall(MatDuplicate(hA->cooMat, op, &hB->cooMat));
237006977982Sstefanozampini     PetscCall(MatHYPRE_AttachCOOMat(*B));
23712c4ab24aSJunchao Zhang   }
23722c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
23732c4ab24aSJunchao Zhang }
23742c4ab24aSJunchao Zhang 
2375d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetPreallocationCOO_HYPRE(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
2376d71ae5a4SJacob Faibussowitsch {
237706977982Sstefanozampini   Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data;
23785fbaff96SJunchao Zhang 
23795fbaff96SJunchao Zhang   PetscFunctionBegin;
2380651b1cf9SStefano Zampini   /* Build an agent matrix cooMat with AIJ format
23815fbaff96SJunchao Zhang      It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work.
23825fbaff96SJunchao Zhang    */
238306977982Sstefanozampini   PetscCall(MatHYPRE_CreateCOOMat(mat));
238406977982Sstefanozampini   PetscCall(MatSetOption(hmat->cooMat, MAT_IGNORE_OFF_PROC_ENTRIES, hmat->donotstash));
238506977982Sstefanozampini   PetscCall(MatSetOption(hmat->cooMat, MAT_NO_OFF_PROC_ENTRIES, mat->nooffprocentries));
2386651b1cf9SStefano Zampini 
2387651b1cf9SStefano Zampini   /* MatSetPreallocationCOO_SeqAIJ and MatSetPreallocationCOO_MPIAIJ uses this specific
2388651b1cf9SStefano Zampini      name to automatically put the diagonal entries first */
238906977982Sstefanozampini   PetscCall(PetscObjectSetName((PetscObject)hmat->cooMat, "_internal_COO_mat_for_hypre"));
239006977982Sstefanozampini   PetscCall(MatSetPreallocationCOO(hmat->cooMat, coo_n, coo_i, coo_j));
239106977982Sstefanozampini   hmat->cooMat->assembled = PETSC_TRUE;
23925fbaff96SJunchao Zhang 
23935fbaff96SJunchao Zhang   /* Copy the sparsity pattern from cooMat to hypre IJMatrix hmat->ij */
23945fbaff96SJunchao Zhang   PetscCall(MatSetOption(mat, MAT_SORTED_FULL, PETSC_TRUE));
239506977982Sstefanozampini   PetscCall(MatHYPRE_CreateFromMat(hmat->cooMat, hmat));      /* Create hmat->ij and preallocate it */
239606977982Sstefanozampini   PetscCall(MatHYPRE_IJMatrixCopyIJ(hmat->cooMat, hmat->ij)); /* Copy A's (i,j) to hmat->ij */
23975fbaff96SJunchao Zhang 
23985fbaff96SJunchao Zhang   mat->preallocated = PETSC_TRUE;
23995fbaff96SJunchao Zhang   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
24005fbaff96SJunchao Zhang   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); /* Migrate mat to device if it is bound to. Hypre builds its own SpMV context here */
24015fbaff96SJunchao Zhang 
24022c4ab24aSJunchao Zhang   /* Attach cooMat to mat */
240306977982Sstefanozampini   PetscCall(MatHYPRE_AttachCOOMat(mat));
24043ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24055fbaff96SJunchao Zhang }
24065fbaff96SJunchao Zhang 
2407d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_HYPRE(Mat mat, const PetscScalar v[], InsertMode imode)
2408d71ae5a4SJacob Faibussowitsch {
24095fbaff96SJunchao Zhang   Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data;
24105fbaff96SJunchao Zhang 
24115fbaff96SJunchao Zhang   PetscFunctionBegin;
2412b73e3080SStefano Zampini   PetscCheck(hmat->cooMat, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet");
24135fbaff96SJunchao Zhang   PetscCall(MatSetValuesCOO(hmat->cooMat, v, imode));
2414651b1cf9SStefano Zampini   PetscCall(MatViewFromOptions(hmat->cooMat, (PetscObject)mat, "-cooMat_view"));
24153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24165fbaff96SJunchao Zhang }
24175fbaff96SJunchao Zhang 
241803db1824SAlex Lindsay static PetscErrorCode MatGetCurrentMemType_HYPRE(Mat A, PetscMemType *m)
241903db1824SAlex Lindsay {
242003db1824SAlex Lindsay   PetscBool petsconcpu;
242103db1824SAlex Lindsay 
242203db1824SAlex Lindsay   PetscFunctionBegin;
242303db1824SAlex Lindsay   PetscCall(MatBoundToCPU(A, &petsconcpu));
242403db1824SAlex Lindsay   *m = petsconcpu ? PETSC_MEMTYPE_HOST : PETSC_MEMTYPE_DEVICE;
242503db1824SAlex Lindsay   PetscFunctionReturn(PETSC_SUCCESS);
242603db1824SAlex Lindsay }
242703db1824SAlex Lindsay 
/*MC
   MATHYPRE - "hypre" - A matrix type to be used for sequential and parallel sparse matrices
          based on the hypre IJ interface.

   Level: intermediate

.seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatHYPRESetPreallocation()`
M*/
2436d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B)
2437d71ae5a4SJacob Faibussowitsch {
243863c07aadSStefano Zampini   Mat_HYPRE *hB;
2439a9e6c71bSAlex Lindsay #if defined(PETSC_HAVE_HYPRE_DEVICE)
2440a9e6c71bSAlex Lindsay   HYPRE_MemoryLocation memory_location;
2441a9e6c71bSAlex Lindsay #endif
244263c07aadSStefano Zampini 
244363c07aadSStefano Zampini   PetscFunctionBegin;
2444a9e6c71bSAlex Lindsay   PetscHYPREInitialize();
24454dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&hB));
24466ea7df73SStefano Zampini 
2447978814f1SStefano Zampini   hB->inner_free      = PETSC_TRUE;
2448651b1cf9SStefano Zampini   hB->array_available = PETSC_TRUE;
2449978814f1SStefano Zampini 
245063c07aadSStefano Zampini   B->data = (void *)hB;
245163c07aadSStefano Zampini 
24529566063dSJacob Faibussowitsch   PetscCall(PetscMemzero(B->ops, sizeof(struct _MatOps)));
245363c07aadSStefano Zampini   B->ops->mult                  = MatMult_HYPRE;
245463c07aadSStefano Zampini   B->ops->multtranspose         = MatMultTranspose_HYPRE;
2455414bd5c3SStefano Zampini   B->ops->multadd               = MatMultAdd_HYPRE;
2456414bd5c3SStefano Zampini   B->ops->multtransposeadd      = MatMultTransposeAdd_HYPRE;
245763c07aadSStefano Zampini   B->ops->setup                 = MatSetUp_HYPRE;
245863c07aadSStefano Zampini   B->ops->destroy               = MatDestroy_HYPRE;
245963c07aadSStefano Zampini   B->ops->assemblyend           = MatAssemblyEnd_HYPRE;
2460c69f721fSFande Kong   B->ops->assemblybegin         = MatAssemblyBegin_HYPRE;
2461d975228cSstefano_zampini   B->ops->setvalues             = MatSetValues_HYPRE;
246268ec7858SStefano Zampini   B->ops->missingdiagonal       = MatMissingDiagonal_HYPRE;
246368ec7858SStefano Zampini   B->ops->scale                 = MatScale_HYPRE;
246468ec7858SStefano Zampini   B->ops->zerorowscolumns       = MatZeroRowsColumns_HYPRE;
2465c69f721fSFande Kong   B->ops->zeroentries           = MatZeroEntries_HYPRE;
2466c69f721fSFande Kong   B->ops->zerorows              = MatZeroRows_HYPRE;
2467c69f721fSFande Kong   B->ops->getrow                = MatGetRow_HYPRE;
2468c69f721fSFande Kong   B->ops->restorerow            = MatRestoreRow_HYPRE;
2469c69f721fSFande Kong   B->ops->getvalues             = MatGetValues_HYPRE;
2470ddbeb582SStefano Zampini   B->ops->setoption             = MatSetOption_HYPRE;
247145b8d346SStefano Zampini   B->ops->duplicate             = MatDuplicate_HYPRE;
2472465edc17SStefano Zampini   B->ops->copy                  = MatCopy_HYPRE;
247345b8d346SStefano Zampini   B->ops->view                  = MatView_HYPRE;
24746305df00SStefano Zampini   B->ops->getdiagonal           = MatGetDiagonal_HYPRE;
2475363d496dSStefano Zampini   B->ops->axpy                  = MatAXPY_HYPRE;
24764222ddf1SHong Zhang   B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE;
247703db1824SAlex Lindsay   B->ops->getcurrentmemtype     = MatGetCurrentMemType_HYPRE;
24786ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
24796ea7df73SStefano Zampini   B->ops->bindtocpu = MatBindToCPU_HYPRE;
2480a9e6c71bSAlex Lindsay   /* Get hypre's default memory location. Users can control this using the corresponding HYPRE_SetMemoryLocation API */
2481a333fa2bSZach Atkins   PetscCallHYPRE(HYPRE_GetMemoryLocation(&memory_location));
2482a9e6c71bSAlex Lindsay   B->boundtocpu = (memory_location == HYPRE_MEMORY_HOST) ? PETSC_TRUE : PETSC_FALSE;
24836ea7df73SStefano Zampini #endif
248445b8d346SStefano Zampini 
248545b8d346SStefano Zampini   /* build cache for off array entries formed */
24869566063dSJacob Faibussowitsch   PetscCall(MatStashCreate_Private(PetscObjectComm((PetscObject)B), 1, &B->stash));
248763c07aadSStefano Zampini 
24889566063dSJacob Faibussowitsch   PetscCall(PetscCommGetComm(PetscObjectComm((PetscObject)B), &hB->comm));
24899566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATHYPRE));
24909566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_aij_C", MatConvert_HYPRE_AIJ));
24919566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_is_C", MatConvert_HYPRE_IS));
24929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_hypre_C", MatProductSetFromOptions_HYPRE));
24939566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaij_hypre_C", MatProductSetFromOptions_HYPRE));
24949566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPRESetPreallocation_C", MatHYPRESetPreallocation_HYPRE));
24959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPREGetParCSR_C", MatHYPREGetParCSR_HYPRE));
24965fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_HYPRE));
24975fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_HYPRE));
24986ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
24996ea7df73SStefano Zampini   #if defined(HYPRE_USING_HIP)
250006977982Sstefanozampini   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_hypre_C", MatProductSetFromOptions_HYPRE));
250106977982Sstefanozampini   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaijhipsparse_hypre_C", MatProductSetFromOptions_HYPRE));
25029566063dSJacob Faibussowitsch   PetscCall(PetscDeviceInitialize(PETSC_DEVICE_HIP));
25039566063dSJacob Faibussowitsch   PetscCall(MatSetVecType(B, VECHIP));
25046ea7df73SStefano Zampini   #endif
25056ea7df73SStefano Zampini   #if defined(HYPRE_USING_CUDA)
250606977982Sstefanozampini   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_hypre_C", MatProductSetFromOptions_HYPRE));
250706977982Sstefanozampini   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaijcusparse_hypre_C", MatProductSetFromOptions_HYPRE));
25089566063dSJacob Faibussowitsch   PetscCall(PetscDeviceInitialize(PETSC_DEVICE_CUDA));
25099566063dSJacob Faibussowitsch   PetscCall(MatSetVecType(B, VECCUDA));
25106ea7df73SStefano Zampini   #endif
25116ea7df73SStefano Zampini #endif
25123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
251363c07aadSStefano Zampini }
2514