xref: /petsc/src/mat/impls/hypre/mhypre.c (revision c3339decea92175325d9368fa13196bcd0e0e58b)
163c07aadSStefano Zampini 
263c07aadSStefano Zampini /*
363c07aadSStefano Zampini     Creates hypre ijmatrix from PETSc matrix
463c07aadSStefano Zampini */
5225daaf8SStefano Zampini 
6c6698e78SStefano Zampini #include <petscpkg_version.h>
739accc25SStefano Zampini #include <petsc/private/petschypre.h>
8dd9c0a25Sstefano_zampini #include <petscmathypre.h>
963c07aadSStefano Zampini #include <petsc/private/matimpl.h>
10a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h>
1163c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h>
1263c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h>
1358968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h>
1458968eb6SStefano Zampini #include <HYPRE.h>
15c1a070e6SStefano Zampini #include <HYPRE_utilities.h>
16cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h>
1768ec7858SStefano Zampini #include <_hypre_sstruct_ls.h>
1863c07aadSStefano Zampini 
190e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
200e6427aaSSatish Balay   #define hypre_ParCSRMatrixClone(A, B) hypre_ParCSRMatrixCompleteClone(A)
210e6427aaSSatish Balay #endif
220e6427aaSSatish Balay 
2363c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat, Mat_HYPRE *);
2463c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat, Mat, HYPRE_IJMatrix);
2563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat, HYPRE_IJMatrix);
2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat, HYPRE_IJMatrix);
2739accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat, HYPRE_Complex, Vec, HYPRE_Complex, Vec, PetscBool);
28225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void *);
296ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[], const PetscScalar[], InsertMode ins);
3063c07aadSStefano Zampini 
31d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij)
32d71ae5a4SJacob Faibussowitsch {
3363c07aadSStefano Zampini   PetscInt        i, n_d, n_o;
3463c07aadSStefano Zampini   const PetscInt *ia_d, *ia_o;
3563c07aadSStefano Zampini   PetscBool       done_d = PETSC_FALSE, done_o = PETSC_FALSE;
362cf14000SStefano Zampini   HYPRE_Int      *nnz_d = NULL, *nnz_o = NULL;
3763c07aadSStefano Zampini 
3863c07aadSStefano Zampini   PetscFunctionBegin;
3963c07aadSStefano Zampini   if (A_d) { /* determine number of nonzero entries in local diagonal part */
409566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, &n_d, &ia_d, NULL, &done_d));
4163c07aadSStefano Zampini     if (done_d) {
429566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(n_d, &nnz_d));
43ad540459SPierre Jolivet       for (i = 0; i < n_d; i++) nnz_d[i] = ia_d[i + 1] - ia_d[i];
4463c07aadSStefano Zampini     }
459566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, NULL, &ia_d, NULL, &done_d));
4663c07aadSStefano Zampini   }
4763c07aadSStefano Zampini   if (A_o) { /* determine number of nonzero entries in local off-diagonal part */
489566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o));
4963c07aadSStefano Zampini     if (done_o) {
509566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(n_o, &nnz_o));
51ad540459SPierre Jolivet       for (i = 0; i < n_o; i++) nnz_o[i] = ia_o[i + 1] - ia_o[i];
5263c07aadSStefano Zampini     }
539566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o));
5463c07aadSStefano Zampini   }
5563c07aadSStefano Zampini   if (done_d) {    /* set number of nonzeros in HYPRE IJ matrix */
5663c07aadSStefano Zampini     if (!done_o) { /* only diagonal part */
579566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(n_d, &nnz_o));
5863c07aadSStefano Zampini     }
59c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
60c6698e78SStefano Zampini     { /* If we don't do this, the columns of the matrix will be all zeros! */
61c6698e78SStefano Zampini       hypre_AuxParCSRMatrix *aux_matrix;
62c6698e78SStefano Zampini       aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
63c6698e78SStefano Zampini       hypre_AuxParCSRMatrixDestroy(aux_matrix);
64c6698e78SStefano Zampini       hypre_IJMatrixTranslator(ij) = NULL;
65792fecdfSBarry Smith       PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, ij, nnz_d, nnz_o);
6622235d61SPierre Jolivet       /* it seems they partially fixed it in 2.19.0 */
6722235d61SPierre Jolivet   #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
68c6698e78SStefano Zampini       aux_matrix                               = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
69c6698e78SStefano Zampini       hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1;
7022235d61SPierre Jolivet   #endif
71c6698e78SStefano Zampini     }
72c6698e78SStefano Zampini #else
73792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, ij, nnz_d, nnz_o);
74c6698e78SStefano Zampini #endif
759566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz_d));
769566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz_o));
7763c07aadSStefano Zampini   }
7863c07aadSStefano Zampini   PetscFunctionReturn(0);
7963c07aadSStefano Zampini }
8063c07aadSStefano Zampini 
81d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA)
82d71ae5a4SJacob Faibussowitsch {
8363c07aadSStefano Zampini   PetscInt rstart, rend, cstart, cend;
8463c07aadSStefano Zampini 
8563c07aadSStefano Zampini   PetscFunctionBegin;
869566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
879566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
8863c07aadSStefano Zampini   rstart = A->rmap->rstart;
8963c07aadSStefano Zampini   rend   = A->rmap->rend;
9063c07aadSStefano Zampini   cstart = A->cmap->rstart;
9163c07aadSStefano Zampini   cend   = A->cmap->rend;
92792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij);
93792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR);
9463c07aadSStefano Zampini   {
9563c07aadSStefano Zampini     PetscBool       same;
9663c07aadSStefano Zampini     Mat             A_d, A_o;
9763c07aadSStefano Zampini     const PetscInt *colmap;
989566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &same));
9963c07aadSStefano Zampini     if (same) {
1009566063dSJacob Faibussowitsch       PetscCall(MatMPIAIJGetSeqAIJ(A, &A_d, &A_o, &colmap));
1019566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij));
10263c07aadSStefano Zampini       PetscFunctionReturn(0);
10363c07aadSStefano Zampini     }
1049566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIBAIJ, &same));
10563c07aadSStefano Zampini     if (same) {
1069566063dSJacob Faibussowitsch       PetscCall(MatMPIBAIJGetSeqBAIJ(A, &A_d, &A_o, &colmap));
1079566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij));
10863c07aadSStefano Zampini       PetscFunctionReturn(0);
10963c07aadSStefano Zampini     }
1109566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &same));
11163c07aadSStefano Zampini     if (same) {
1129566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij));
11363c07aadSStefano Zampini       PetscFunctionReturn(0);
11463c07aadSStefano Zampini     }
1159566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQBAIJ, &same));
11663c07aadSStefano Zampini     if (same) {
1179566063dSJacob Faibussowitsch       PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij));
11863c07aadSStefano Zampini       PetscFunctionReturn(0);
11963c07aadSStefano Zampini     }
12063c07aadSStefano Zampini   }
12163c07aadSStefano Zampini   PetscFunctionReturn(0);
12263c07aadSStefano Zampini }
12363c07aadSStefano Zampini 
124d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixCopy(Mat A, HYPRE_IJMatrix ij)
125d71ae5a4SJacob Faibussowitsch {
12663c07aadSStefano Zampini   PetscInt           i, rstart, rend, ncols, nr, nc;
12763c07aadSStefano Zampini   const PetscScalar *values;
12863c07aadSStefano Zampini   const PetscInt    *cols;
12963c07aadSStefano Zampini   PetscBool          flg;
13063c07aadSStefano Zampini 
13163c07aadSStefano Zampini   PetscFunctionBegin;
1326ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
133792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixInitialize, ij);
1346ea7df73SStefano Zampini #else
135792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixInitialize_v2, ij, HYPRE_MEMORY_HOST);
1366ea7df73SStefano Zampini #endif
1379566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &flg));
1389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &nr, &nc));
13963c07aadSStefano Zampini   if (flg && nr == nc) {
1409566063dSJacob Faibussowitsch     PetscCall(MatHYPRE_IJMatrixFastCopy_MPIAIJ(A, ij));
14163c07aadSStefano Zampini     PetscFunctionReturn(0);
14263c07aadSStefano Zampini   }
1439566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &flg));
14463c07aadSStefano Zampini   if (flg) {
1459566063dSJacob Faibussowitsch     PetscCall(MatHYPRE_IJMatrixFastCopy_SeqAIJ(A, ij));
14663c07aadSStefano Zampini     PetscFunctionReturn(0);
14763c07aadSStefano Zampini   }
14863c07aadSStefano Zampini 
1495fbaff96SJunchao Zhang   /* Do not need Aux since we have done precise i[],j[] allocation in MatHYPRE_CreateFromMat() */
1505fbaff96SJunchao Zhang   hypre_AuxParCSRMatrixNeedAux((hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij)) = 0;
1515fbaff96SJunchao Zhang 
1529566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A, &rstart, &rend));
15363c07aadSStefano Zampini   for (i = rstart; i < rend; i++) {
1549566063dSJacob Faibussowitsch     PetscCall(MatGetRow(A, i, &ncols, &cols, &values));
155e3977e59Sstefano_zampini     if (ncols) {
1562cf14000SStefano Zampini       HYPRE_Int nc = (HYPRE_Int)ncols;
1572cf14000SStefano Zampini 
158aed4548fSBarry Smith       PetscCheck((PetscInt)nc == ncols, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, ncols, i);
159792fecdfSBarry Smith       PetscCallExternal(HYPRE_IJMatrixSetValues, ij, 1, &nc, (HYPRE_BigInt *)&i, (HYPRE_BigInt *)cols, (HYPRE_Complex *)values);
160e3977e59Sstefano_zampini     }
1619566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow(A, i, &ncols, &cols, &values));
16263c07aadSStefano Zampini   }
16363c07aadSStefano Zampini   PetscFunctionReturn(0);
16463c07aadSStefano Zampini }
16563c07aadSStefano Zampini 
166d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat A, HYPRE_IJMatrix ij)
167d71ae5a4SJacob Faibussowitsch {
16863c07aadSStefano Zampini   Mat_SeqAIJ            *pdiag = (Mat_SeqAIJ *)A->data;
16958968eb6SStefano Zampini   HYPRE_Int              type;
17063c07aadSStefano Zampini   hypre_ParCSRMatrix    *par_matrix;
17163c07aadSStefano Zampini   hypre_AuxParCSRMatrix *aux_matrix;
17263c07aadSStefano Zampini   hypre_CSRMatrix       *hdiag;
1732cf14000SStefano Zampini   PetscBool              sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
1746ea7df73SStefano Zampini   const PetscScalar     *pa;
17563c07aadSStefano Zampini 
17663c07aadSStefano Zampini   PetscFunctionBegin;
177792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, ij, &type);
17808401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
179792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, ij, (void **)&par_matrix);
18063c07aadSStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(par_matrix);
18163c07aadSStefano Zampini   /*
18263c07aadSStefano Zampini        this is the Hack part where we monkey directly with the hypre datastructures
18363c07aadSStefano Zampini   */
1842cf14000SStefano Zampini   if (sameint) {
1859566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->i, pdiag->i, A->rmap->n + 1));
1869566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->j, pdiag->j, pdiag->nz));
1872cf14000SStefano Zampini   } else {
1882cf14000SStefano Zampini     PetscInt i;
1892cf14000SStefano Zampini 
1902cf14000SStefano Zampini     for (i = 0; i < A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i];
1912cf14000SStefano Zampini     for (i = 0; i < pdiag->nz; i++) hdiag->j[i] = (HYPRE_Int)pdiag->j[i];
1922cf14000SStefano Zampini   }
1936ea7df73SStefano Zampini 
1949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &pa));
1959566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(hdiag->data, pa, pdiag->nz));
1969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &pa));
197ea9daf28SStefano Zampini 
198ea9daf28SStefano Zampini   aux_matrix                               = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
19963c07aadSStefano Zampini   hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0;
20063c07aadSStefano Zampini   PetscFunctionReturn(0);
20163c07aadSStefano Zampini }
20263c07aadSStefano Zampini 
203d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat A, HYPRE_IJMatrix ij)
204d71ae5a4SJacob Faibussowitsch {
20563c07aadSStefano Zampini   Mat_MPIAIJ            *pA = (Mat_MPIAIJ *)A->data;
20663c07aadSStefano Zampini   Mat_SeqAIJ            *pdiag, *poffd;
20763c07aadSStefano Zampini   PetscInt               i, *garray = pA->garray, *jj, cstart, *pjj;
2082cf14000SStefano Zampini   HYPRE_Int             *hjj, type;
20963c07aadSStefano Zampini   hypre_ParCSRMatrix    *par_matrix;
21063c07aadSStefano Zampini   hypre_AuxParCSRMatrix *aux_matrix;
21163c07aadSStefano Zampini   hypre_CSRMatrix       *hdiag, *hoffd;
2122cf14000SStefano Zampini   PetscBool              sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
2136ea7df73SStefano Zampini   const PetscScalar     *pa;
21463c07aadSStefano Zampini 
21563c07aadSStefano Zampini   PetscFunctionBegin;
21663c07aadSStefano Zampini   pdiag = (Mat_SeqAIJ *)pA->A->data;
21763c07aadSStefano Zampini   poffd = (Mat_SeqAIJ *)pA->B->data;
21863c07aadSStefano Zampini   /* cstart is only valid for square MPIAIJ layed out in the usual way */
2199566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A, &cstart, NULL));
22063c07aadSStefano Zampini 
221792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, ij, &type);
22208401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
223792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, ij, (void **)&par_matrix);
22463c07aadSStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(par_matrix);
22563c07aadSStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(par_matrix);
22663c07aadSStefano Zampini 
22763c07aadSStefano Zampini   /*
22863c07aadSStefano Zampini        this is the Hack part where we monkey directly with the hypre datastructures
22963c07aadSStefano Zampini   */
2302cf14000SStefano Zampini   if (sameint) {
2319566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hdiag->i, pdiag->i, pA->A->rmap->n + 1));
2322cf14000SStefano Zampini   } else {
2332cf14000SStefano Zampini     for (i = 0; i < pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)(pdiag->i[i]);
2342cf14000SStefano Zampini   }
23563c07aadSStefano Zampini   /* need to shift the diag column indices (hdiag->j) back to global numbering since hypre is expecting this */
2362cf14000SStefano Zampini   hjj = hdiag->j;
2372cf14000SStefano Zampini   pjj = pdiag->j;
238c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
2392cf14000SStefano Zampini   for (i = 0; i < pdiag->nz; i++) hjj[i] = pjj[i];
240c6698e78SStefano Zampini #else
2412cf14000SStefano Zampini   for (i = 0; i < pdiag->nz; i++) hjj[i] = cstart + pjj[i];
242c6698e78SStefano Zampini #endif
2439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(pA->A, &pa));
2449566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(hdiag->data, pa, pdiag->nz));
2459566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(pA->A, &pa));
2462cf14000SStefano Zampini   if (sameint) {
2479566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hoffd->i, poffd->i, pA->A->rmap->n + 1));
2482cf14000SStefano Zampini   } else {
2492cf14000SStefano Zampini     for (i = 0; i < pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)(poffd->i[i]);
2502cf14000SStefano Zampini   }
2512cf14000SStefano Zampini 
25263c07aadSStefano Zampini   /* need to move the offd column indices (hoffd->j) back to global numbering since hypre is expecting this
25363c07aadSStefano Zampini      If we hacked a hypre a bit more we might be able to avoid this step */
254c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
255792fecdfSBarry Smith   PetscCallExternal(hypre_CSRMatrixBigInitialize, hoffd);
256c6698e78SStefano Zampini   jj = (PetscInt *)hoffd->big_j;
257c6698e78SStefano Zampini #else
25863c07aadSStefano Zampini   jj = (PetscInt *)hoffd->j;
259c6698e78SStefano Zampini #endif
2602cf14000SStefano Zampini   pjj = poffd->j;
26163c07aadSStefano Zampini   for (i = 0; i < poffd->nz; i++) jj[i] = garray[pjj[i]];
262c6698e78SStefano Zampini 
2639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(pA->B, &pa));
2649566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(hoffd->data, pa, poffd->nz));
2659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(pA->B, &pa));
26663c07aadSStefano Zampini 
267ea9daf28SStefano Zampini   aux_matrix                               = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
26863c07aadSStefano Zampini   hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0;
26963c07aadSStefano Zampini   PetscFunctionReturn(0);
27063c07aadSStefano Zampini }
27163c07aadSStefano Zampini 
272d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat *B)
273d71ae5a4SJacob Faibussowitsch {
2742df22349SStefano Zampini   Mat_HYPRE             *mhA = (Mat_HYPRE *)(A->data);
2752df22349SStefano Zampini   Mat                    lA;
2762df22349SStefano Zampini   ISLocalToGlobalMapping rl2g, cl2g;
2772df22349SStefano Zampini   IS                     is;
2782df22349SStefano Zampini   hypre_ParCSRMatrix    *hA;
2792df22349SStefano Zampini   hypre_CSRMatrix       *hdiag, *hoffd;
2802df22349SStefano Zampini   MPI_Comm               comm;
28139accc25SStefano Zampini   HYPRE_Complex         *hdd, *hod, *aa;
28239accc25SStefano Zampini   PetscScalar           *data;
2832cf14000SStefano Zampini   HYPRE_BigInt          *col_map_offd;
2842cf14000SStefano Zampini   HYPRE_Int             *hdi, *hdj, *hoi, *hoj;
2852df22349SStefano Zampini   PetscInt              *ii, *jj, *iptr, *jptr;
2862df22349SStefano Zampini   PetscInt               cum, dr, dc, oc, str, stc, nnz, i, jd, jo, M, N;
28758968eb6SStefano Zampini   HYPRE_Int              type;
2882df22349SStefano Zampini 
2892df22349SStefano Zampini   PetscFunctionBegin;
290a1787963SStefano Zampini   comm = PetscObjectComm((PetscObject)A);
291792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, mhA->ij, &type);
29208401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
293792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, mhA->ij, (void **)&hA);
2942df22349SStefano Zampini   M     = hypre_ParCSRMatrixGlobalNumRows(hA);
2952df22349SStefano Zampini   N     = hypre_ParCSRMatrixGlobalNumCols(hA);
2962df22349SStefano Zampini   str   = hypre_ParCSRMatrixFirstRowIndex(hA);
2972df22349SStefano Zampini   stc   = hypre_ParCSRMatrixFirstColDiag(hA);
2982df22349SStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(hA);
2992df22349SStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(hA);
3002df22349SStefano Zampini   dr    = hypre_CSRMatrixNumRows(hdiag);
3012df22349SStefano Zampini   dc    = hypre_CSRMatrixNumCols(hdiag);
3022df22349SStefano Zampini   nnz   = hypre_CSRMatrixNumNonzeros(hdiag);
3032df22349SStefano Zampini   hdi   = hypre_CSRMatrixI(hdiag);
3042df22349SStefano Zampini   hdj   = hypre_CSRMatrixJ(hdiag);
3052df22349SStefano Zampini   hdd   = hypre_CSRMatrixData(hdiag);
3062df22349SStefano Zampini   oc    = hypre_CSRMatrixNumCols(hoffd);
3072df22349SStefano Zampini   nnz += hypre_CSRMatrixNumNonzeros(hoffd);
3082df22349SStefano Zampini   hoi = hypre_CSRMatrixI(hoffd);
3092df22349SStefano Zampini   hoj = hypre_CSRMatrixJ(hoffd);
3102df22349SStefano Zampini   hod = hypre_CSRMatrixData(hoffd);
3112df22349SStefano Zampini   if (reuse != MAT_REUSE_MATRIX) {
3122df22349SStefano Zampini     PetscInt *aux;
3132df22349SStefano Zampini 
3142df22349SStefano Zampini     /* generate l2g maps for rows and cols */
3159566063dSJacob Faibussowitsch     PetscCall(ISCreateStride(comm, dr, str, 1, &is));
3169566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingCreateIS(is, &rl2g));
3179566063dSJacob Faibussowitsch     PetscCall(ISDestroy(&is));
3182df22349SStefano Zampini     col_map_offd = hypre_ParCSRMatrixColMapOffd(hA);
3199566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dc + oc, &aux));
3202df22349SStefano Zampini     for (i = 0; i < dc; i++) aux[i] = i + stc;
3212df22349SStefano Zampini     for (i = 0; i < oc; i++) aux[i + dc] = col_map_offd[i];
3229566063dSJacob Faibussowitsch     PetscCall(ISCreateGeneral(comm, dc + oc, aux, PETSC_OWN_POINTER, &is));
3239566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingCreateIS(is, &cl2g));
3249566063dSJacob Faibussowitsch     PetscCall(ISDestroy(&is));
3252df22349SStefano Zampini     /* create MATIS object */
3269566063dSJacob Faibussowitsch     PetscCall(MatCreate(comm, B));
3279566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(*B, dr, dc, M, N));
3289566063dSJacob Faibussowitsch     PetscCall(MatSetType(*B, MATIS));
3299566063dSJacob Faibussowitsch     PetscCall(MatSetLocalToGlobalMapping(*B, rl2g, cl2g));
3309566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingDestroy(&rl2g));
3319566063dSJacob Faibussowitsch     PetscCall(ISLocalToGlobalMappingDestroy(&cl2g));
3322df22349SStefano Zampini 
3332df22349SStefano Zampini     /* allocate CSR for local matrix */
3349566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dr + 1, &iptr));
3359566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz, &jptr));
3369566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz, &data));
3372df22349SStefano Zampini   } else {
3382df22349SStefano Zampini     PetscInt  nr;
3392df22349SStefano Zampini     PetscBool done;
3409566063dSJacob Faibussowitsch     PetscCall(MatISGetLocalMat(*B, &lA));
3419566063dSJacob Faibussowitsch     PetscCall(MatGetRowIJ(lA, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&iptr, (const PetscInt **)&jptr, &done));
34208401ef6SPierre Jolivet     PetscCheck(nr == dr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT, nr, dr);
34308401ef6SPierre Jolivet     PetscCheck(iptr[nr] >= nnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in local mat! reuse %" PetscInt_FMT " requested %" PetscInt_FMT, iptr[nr], nnz);
3449566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(lA, &data));
3452df22349SStefano Zampini   }
3462df22349SStefano Zampini   /* merge local matrices */
3472df22349SStefano Zampini   ii  = iptr;
3482df22349SStefano Zampini   jj  = jptr;
34939accc25SStefano Zampini   aa  = (HYPRE_Complex *)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */
3502df22349SStefano Zampini   *ii = *(hdi++) + *(hoi++);
3512df22349SStefano Zampini   for (jd = 0, jo = 0, cum = 0; *ii < nnz; cum++) {
35239accc25SStefano Zampini     PetscScalar *aold = (PetscScalar *)aa;
3532df22349SStefano Zampini     PetscInt    *jold = jj, nc = jd + jo;
3549371c9d4SSatish Balay     for (; jd < *hdi; jd++) {
3559371c9d4SSatish Balay       *jj++ = *hdj++;
3569371c9d4SSatish Balay       *aa++ = *hdd++;
3579371c9d4SSatish Balay     }
3589371c9d4SSatish Balay     for (; jo < *hoi; jo++) {
3599371c9d4SSatish Balay       *jj++ = *hoj++ + dc;
3609371c9d4SSatish Balay       *aa++ = *hod++;
3619371c9d4SSatish Balay     }
3622df22349SStefano Zampini     *(++ii) = *(hdi++) + *(hoi++);
3639566063dSJacob Faibussowitsch     PetscCall(PetscSortIntWithScalarArray(jd + jo - nc, jold, aold));
3642df22349SStefano Zampini   }
3652df22349SStefano Zampini   for (; cum < dr; cum++) *(++ii) = nnz;
3662df22349SStefano Zampini   if (reuse != MAT_REUSE_MATRIX) {
367a033916dSStefano Zampini     Mat_SeqAIJ *a;
368a033916dSStefano Zampini 
3699566063dSJacob Faibussowitsch     PetscCall(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF, dr, dc + oc, iptr, jptr, data, &lA));
3709566063dSJacob Faibussowitsch     PetscCall(MatISSetLocalMat(*B, lA));
371a033916dSStefano Zampini     /* hack SeqAIJ */
372a033916dSStefano Zampini     a          = (Mat_SeqAIJ *)(lA->data);
373a033916dSStefano Zampini     a->free_a  = PETSC_TRUE;
374a033916dSStefano Zampini     a->free_ij = PETSC_TRUE;
3759566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&lA));
3762df22349SStefano Zampini   }
3779566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
3789566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
37948a46eb9SPierre Jolivet   if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, B));
3802df22349SStefano Zampini   PetscFunctionReturn(0);
3812df22349SStefano Zampini }
3822df22349SStefano Zampini 
383d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B)
384d71ae5a4SJacob Faibussowitsch {
38584d4e069SStefano Zampini   Mat        M = NULL;
38663c07aadSStefano Zampini   Mat_HYPRE *hB;
38763c07aadSStefano Zampini   MPI_Comm   comm = PetscObjectComm((PetscObject)A);
38863c07aadSStefano Zampini 
38963c07aadSStefano Zampini   PetscFunctionBegin;
39063c07aadSStefano Zampini   if (reuse == MAT_REUSE_MATRIX) {
39163c07aadSStefano Zampini     /* always destroy the old matrix and create a new memory;
39263c07aadSStefano Zampini        hope this does not churn the memory too much. The problem
39363c07aadSStefano Zampini        is I do not know if it is possible to put the matrix back to
39463c07aadSStefano Zampini        its initial state so that we can directly copy the values
39563c07aadSStefano Zampini        the second time through. */
39663c07aadSStefano Zampini     hB = (Mat_HYPRE *)((*B)->data);
397792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixDestroy, hB->ij);
39863c07aadSStefano Zampini   } else {
3999566063dSJacob Faibussowitsch     PetscCall(MatCreate(comm, &M));
4009566063dSJacob Faibussowitsch     PetscCall(MatSetType(M, MATHYPRE));
4019566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N));
40284d4e069SStefano Zampini     hB = (Mat_HYPRE *)(M->data);
40384d4e069SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) *B = M;
40463c07aadSStefano Zampini   }
4059566063dSJacob Faibussowitsch   PetscCall(MatSetOption(*B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */
4069566063dSJacob Faibussowitsch   PetscCall(MatSetOption(*B, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE));
4079566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_CreateFromMat(A, hB));
4089566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_IJMatrixCopy(A, hB->ij));
40948a46eb9SPierre Jolivet   if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M));
4104ec6421dSstefano_zampini   (*B)->preallocated = PETSC_TRUE;
4119566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
4129566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
41363c07aadSStefano Zampini   PetscFunctionReturn(0);
41463c07aadSStefano Zampini }
41563c07aadSStefano Zampini 
416d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B)
417d71ae5a4SJacob Faibussowitsch {
41863c07aadSStefano Zampini   Mat_HYPRE          *hA = (Mat_HYPRE *)A->data;
41963c07aadSStefano Zampini   hypre_ParCSRMatrix *parcsr;
42063c07aadSStefano Zampini   hypre_CSRMatrix    *hdiag, *hoffd;
42163c07aadSStefano Zampini   MPI_Comm            comm;
42263c07aadSStefano Zampini   PetscScalar        *da, *oa, *aptr;
42363c07aadSStefano Zampini   PetscInt           *dii, *djj, *oii, *ojj, *iptr;
42463c07aadSStefano Zampini   PetscInt            i, dnnz, onnz, m, n;
42558968eb6SStefano Zampini   HYPRE_Int           type;
42663c07aadSStefano Zampini   PetscMPIInt         size;
4272cf14000SStefano Zampini   PetscBool           sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
42863c07aadSStefano Zampini 
42963c07aadSStefano Zampini   PetscFunctionBegin;
43063c07aadSStefano Zampini   comm = PetscObjectComm((PetscObject)A);
431792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type);
43208401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
43363c07aadSStefano Zampini   if (reuse == MAT_REUSE_MATRIX) {
43463c07aadSStefano Zampini     PetscBool ismpiaij, isseqaij;
4359566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATMPIAIJ, &ismpiaij));
4369566063dSJacob Faibussowitsch     PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATSEQAIJ, &isseqaij));
43708401ef6SPierre Jolivet     PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Only MATMPIAIJ or MATSEQAIJ are supported");
43863c07aadSStefano Zampini   }
4396ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
44008401ef6SPierre Jolivet   PetscCheck(HYPRE_MEMORY_DEVICE != hypre_IJMatrixMemoryLocation(hA->ij), comm, PETSC_ERR_SUP, "Not yet implemented");
4416ea7df73SStefano Zampini #endif
4429566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(comm, &size));
44363c07aadSStefano Zampini 
444792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr);
44563c07aadSStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(parcsr);
44663c07aadSStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(parcsr);
44763c07aadSStefano Zampini   m     = hypre_CSRMatrixNumRows(hdiag);
44863c07aadSStefano Zampini   n     = hypre_CSRMatrixNumCols(hdiag);
44963c07aadSStefano Zampini   dnnz  = hypre_CSRMatrixNumNonzeros(hdiag);
45063c07aadSStefano Zampini   onnz  = hypre_CSRMatrixNumNonzeros(hoffd);
451225daaf8SStefano Zampini   if (reuse == MAT_INITIAL_MATRIX) {
4529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &dii));
4539566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dnnz, &djj));
4549566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(dnnz, &da));
455225daaf8SStefano Zampini   } else if (reuse == MAT_REUSE_MATRIX) {
45663c07aadSStefano Zampini     PetscInt  nr;
45763c07aadSStefano Zampini     PetscBool done;
45863c07aadSStefano Zampini     if (size > 1) {
45963c07aadSStefano Zampini       Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data);
46063c07aadSStefano Zampini 
4619566063dSJacob Faibussowitsch       PetscCall(MatGetRowIJ(b->A, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&dii, (const PetscInt **)&djj, &done));
46208401ef6SPierre Jolivet       PetscCheck(nr == m, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows in diag part! %" PetscInt_FMT " != %" PetscInt_FMT, nr, m);
46308401ef6SPierre Jolivet       PetscCheck(dii[nr] >= dnnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in diag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, dii[nr], dnnz);
4649566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(b->A, &da));
46563c07aadSStefano Zampini     } else {
4669566063dSJacob Faibussowitsch       PetscCall(MatGetRowIJ(*B, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&dii, (const PetscInt **)&djj, &done));
46708401ef6SPierre Jolivet       PetscCheck(nr == m, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows! %" PetscInt_FMT " != %" PetscInt_FMT, nr, m);
46808401ef6SPierre Jolivet       PetscCheck(dii[nr] >= dnnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, dii[nr], dnnz);
4699566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(*B, &da));
47063c07aadSStefano Zampini     }
471225daaf8SStefano Zampini   } else { /* MAT_INPLACE_MATRIX */
4722cf14000SStefano Zampini     if (!sameint) {
4739566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &dii));
4749566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(dnnz, &djj));
4752cf14000SStefano Zampini     } else {
4767d968826Sstefano_zampini       dii = (PetscInt *)hypre_CSRMatrixI(hdiag);
4777d968826Sstefano_zampini       djj = (PetscInt *)hypre_CSRMatrixJ(hdiag);
47863c07aadSStefano Zampini     }
47939accc25SStefano Zampini     da = (PetscScalar *)hypre_CSRMatrixData(hdiag);
48063c07aadSStefano Zampini   }
4812cf14000SStefano Zampini 
4822cf14000SStefano Zampini   if (!sameint) {
4839371c9d4SSatish Balay     if (reuse != MAT_REUSE_MATRIX) {
4849371c9d4SSatish Balay       for (i = 0; i < m + 1; i++) dii[i] = (PetscInt)(hypre_CSRMatrixI(hdiag)[i]);
4859371c9d4SSatish Balay     }
4862cf14000SStefano Zampini     for (i = 0; i < dnnz; i++) djj[i] = (PetscInt)(hypre_CSRMatrixJ(hdiag)[i]);
4872cf14000SStefano Zampini   } else {
4889566063dSJacob Faibussowitsch     if (reuse != MAT_REUSE_MATRIX) PetscCall(PetscArraycpy(dii, hypre_CSRMatrixI(hdiag), m + 1));
4899566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(djj, hypre_CSRMatrixJ(hdiag), dnnz));
4902cf14000SStefano Zampini   }
4919566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(da, hypre_CSRMatrixData(hdiag), dnnz));
49263c07aadSStefano Zampini   iptr = djj;
49363c07aadSStefano Zampini   aptr = da;
49463c07aadSStefano Zampini   for (i = 0; i < m; i++) {
49563c07aadSStefano Zampini     PetscInt nc = dii[i + 1] - dii[i];
4969566063dSJacob Faibussowitsch     PetscCall(PetscSortIntWithScalarArray(nc, iptr, aptr));
49763c07aadSStefano Zampini     iptr += nc;
49863c07aadSStefano Zampini     aptr += nc;
49963c07aadSStefano Zampini   }
50063c07aadSStefano Zampini   if (size > 1) {
5012cf14000SStefano Zampini     HYPRE_BigInt *coffd;
5022cf14000SStefano Zampini     HYPRE_Int    *offdj;
50363c07aadSStefano Zampini 
504225daaf8SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) {
5059566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &oii));
5069566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(onnz, &ojj));
5079566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(onnz, &oa));
508225daaf8SStefano Zampini     } else if (reuse == MAT_REUSE_MATRIX) {
50963c07aadSStefano Zampini       Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data);
51063c07aadSStefano Zampini       PetscInt    nr, hr = hypre_CSRMatrixNumRows(hoffd);
51163c07aadSStefano Zampini       PetscBool   done;
51263c07aadSStefano Zampini 
5139566063dSJacob Faibussowitsch       PetscCall(MatGetRowIJ(b->B, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&oii, (const PetscInt **)&ojj, &done));
51408401ef6SPierre Jolivet       PetscCheck(nr == hr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows in offdiag part! %" PetscInt_FMT " != %" PetscInt_FMT, nr, hr);
51508401ef6SPierre Jolivet       PetscCheck(oii[nr] >= onnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in offdiag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, oii[nr], onnz);
5169566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(b->B, &oa));
517225daaf8SStefano Zampini     } else { /* MAT_INPLACE_MATRIX */
5182cf14000SStefano Zampini       if (!sameint) {
5199566063dSJacob Faibussowitsch         PetscCall(PetscMalloc1(m + 1, &oii));
5209566063dSJacob Faibussowitsch         PetscCall(PetscMalloc1(onnz, &ojj));
5212cf14000SStefano Zampini       } else {
5227d968826Sstefano_zampini         oii = (PetscInt *)hypre_CSRMatrixI(hoffd);
5237d968826Sstefano_zampini         ojj = (PetscInt *)hypre_CSRMatrixJ(hoffd);
52463c07aadSStefano Zampini       }
52539accc25SStefano Zampini       oa = (PetscScalar *)hypre_CSRMatrixData(hoffd);
52663c07aadSStefano Zampini     }
527a16187a7SStefano Zampini     if (reuse != MAT_REUSE_MATRIX) {
5282cf14000SStefano Zampini       if (!sameint) {
5292cf14000SStefano Zampini         for (i = 0; i < m + 1; i++) oii[i] = (PetscInt)(hypre_CSRMatrixI(hoffd)[i]);
5302cf14000SStefano Zampini       } else {
5319566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(oii, hypre_CSRMatrixI(hoffd), m + 1));
5322cf14000SStefano Zampini       }
533a16187a7SStefano Zampini     }
5349566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(oa, hypre_CSRMatrixData(hoffd), onnz));
535a16187a7SStefano Zampini 
53663c07aadSStefano Zampini     offdj = hypre_CSRMatrixJ(hoffd);
53763c07aadSStefano Zampini     coffd = hypre_ParCSRMatrixColMapOffd(parcsr);
538a16187a7SStefano Zampini     /* we only need the permutation to be computed properly, I don't know if HYPRE
539a16187a7SStefano Zampini        messes up with the ordering. Just in case, allocate some memory and free it
540a16187a7SStefano Zampini        later */
541a16187a7SStefano Zampini     if (reuse == MAT_REUSE_MATRIX) {
542a16187a7SStefano Zampini       Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data);
543a16187a7SStefano Zampini       PetscInt    mnz;
544a16187a7SStefano Zampini 
5459566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetMaxRowNonzeros(b->B, &mnz));
5469566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(mnz, &ojj));
5479371c9d4SSatish Balay     } else
5489371c9d4SSatish Balay       for (i = 0; i < onnz; i++) ojj[i] = coffd[offdj[i]];
54963c07aadSStefano Zampini     iptr = ojj;
55063c07aadSStefano Zampini     aptr = oa;
55163c07aadSStefano Zampini     for (i = 0; i < m; i++) {
55263c07aadSStefano Zampini       PetscInt nc = oii[i + 1] - oii[i];
553a16187a7SStefano Zampini       if (reuse == MAT_REUSE_MATRIX) {
554a16187a7SStefano Zampini         PetscInt j;
555a16187a7SStefano Zampini 
556a16187a7SStefano Zampini         iptr = ojj;
557a16187a7SStefano Zampini         for (j = 0; j < nc; j++) iptr[j] = coffd[offdj[oii[i] + j]];
558a16187a7SStefano Zampini       }
5599566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(nc, iptr, aptr));
56063c07aadSStefano Zampini       iptr += nc;
56163c07aadSStefano Zampini       aptr += nc;
56263c07aadSStefano Zampini     }
5639566063dSJacob Faibussowitsch     if (reuse == MAT_REUSE_MATRIX) PetscCall(PetscFree(ojj));
564225daaf8SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) {
56563c07aadSStefano Zampini       Mat_MPIAIJ *b;
56663c07aadSStefano Zampini       Mat_SeqAIJ *d, *o;
567225daaf8SStefano Zampini 
5689566063dSJacob Faibussowitsch       PetscCall(MatCreateMPIAIJWithSplitArrays(comm, m, n, PETSC_DECIDE, PETSC_DECIDE, dii, djj, da, oii, ojj, oa, B));
56963c07aadSStefano Zampini       /* hack MPIAIJ */
57063c07aadSStefano Zampini       b          = (Mat_MPIAIJ *)((*B)->data);
57163c07aadSStefano Zampini       d          = (Mat_SeqAIJ *)b->A->data;
57263c07aadSStefano Zampini       o          = (Mat_SeqAIJ *)b->B->data;
57363c07aadSStefano Zampini       d->free_a  = PETSC_TRUE;
57463c07aadSStefano Zampini       d->free_ij = PETSC_TRUE;
57563c07aadSStefano Zampini       o->free_a  = PETSC_TRUE;
57663c07aadSStefano Zampini       o->free_ij = PETSC_TRUE;
577225daaf8SStefano Zampini     } else if (reuse == MAT_INPLACE_MATRIX) {
578225daaf8SStefano Zampini       Mat T;
5792cf14000SStefano Zampini 
5809566063dSJacob Faibussowitsch       PetscCall(MatCreateMPIAIJWithSplitArrays(comm, m, n, PETSC_DECIDE, PETSC_DECIDE, dii, djj, da, oii, ojj, oa, &T));
5812cf14000SStefano Zampini       if (sameint) { /* ownership of CSR pointers is transferred to PETSc */
582225daaf8SStefano Zampini         hypre_CSRMatrixI(hdiag) = NULL;
583225daaf8SStefano Zampini         hypre_CSRMatrixJ(hdiag) = NULL;
584225daaf8SStefano Zampini         hypre_CSRMatrixI(hoffd) = NULL;
585225daaf8SStefano Zampini         hypre_CSRMatrixJ(hoffd) = NULL;
5862cf14000SStefano Zampini       } else { /* Hack MPIAIJ -> free ij but not a */
5872cf14000SStefano Zampini         Mat_MPIAIJ *b = (Mat_MPIAIJ *)(T->data);
5882cf14000SStefano Zampini         Mat_SeqAIJ *d = (Mat_SeqAIJ *)(b->A->data);
5892cf14000SStefano Zampini         Mat_SeqAIJ *o = (Mat_SeqAIJ *)(b->B->data);
5902cf14000SStefano Zampini 
5912cf14000SStefano Zampini         d->free_ij = PETSC_TRUE;
5922cf14000SStefano Zampini         o->free_ij = PETSC_TRUE;
5932cf14000SStefano Zampini       }
5942cf14000SStefano Zampini       hypre_CSRMatrixData(hdiag) = NULL;
595225daaf8SStefano Zampini       hypre_CSRMatrixData(hoffd) = NULL;
5969566063dSJacob Faibussowitsch       PetscCall(MatHeaderReplace(A, &T));
59763c07aadSStefano Zampini     }
598225daaf8SStefano Zampini   } else {
599225daaf8SStefano Zampini     oii = NULL;
600225daaf8SStefano Zampini     ojj = NULL;
601225daaf8SStefano Zampini     oa  = NULL;
602225daaf8SStefano Zampini     if (reuse == MAT_INITIAL_MATRIX) {
60363c07aadSStefano Zampini       Mat_SeqAIJ *b;
6042cf14000SStefano Zampini 
6059566063dSJacob Faibussowitsch       PetscCall(MatCreateSeqAIJWithArrays(comm, m, n, dii, djj, da, B));
60663c07aadSStefano Zampini       /* hack SeqAIJ */
60763c07aadSStefano Zampini       b          = (Mat_SeqAIJ *)((*B)->data);
60863c07aadSStefano Zampini       b->free_a  = PETSC_TRUE;
60963c07aadSStefano Zampini       b->free_ij = PETSC_TRUE;
610225daaf8SStefano Zampini     } else if (reuse == MAT_INPLACE_MATRIX) {
611225daaf8SStefano Zampini       Mat T;
6122cf14000SStefano Zampini 
6139566063dSJacob Faibussowitsch       PetscCall(MatCreateSeqAIJWithArrays(comm, m, n, dii, djj, da, &T));
6142cf14000SStefano Zampini       if (sameint) { /* ownership of CSR pointers is transferred to PETSc */
615225daaf8SStefano Zampini         hypre_CSRMatrixI(hdiag) = NULL;
616225daaf8SStefano Zampini         hypre_CSRMatrixJ(hdiag) = NULL;
6172cf14000SStefano Zampini       } else { /* free ij but not a */
6182cf14000SStefano Zampini         Mat_SeqAIJ *b = (Mat_SeqAIJ *)(T->data);
6192cf14000SStefano Zampini 
6202cf14000SStefano Zampini         b->free_ij = PETSC_TRUE;
6212cf14000SStefano Zampini       }
622225daaf8SStefano Zampini       hypre_CSRMatrixData(hdiag) = NULL;
6239566063dSJacob Faibussowitsch       PetscCall(MatHeaderReplace(A, &T));
62463c07aadSStefano Zampini     }
625225daaf8SStefano Zampini   }
626225daaf8SStefano Zampini 
6272cf14000SStefano Zampini   /* we have to use hypre_TFree to free the HYPRE arrays
6282cf14000SStefano Zampini      that PETSc now owns */
62963c07aadSStefano Zampini   if (reuse == MAT_INPLACE_MATRIX) {
6302cf14000SStefano Zampini     PetscInt    nh;
6312cf14000SStefano Zampini     void       *ptrs[6]  = {da, oa, dii, djj, oii, ojj};
6329371c9d4SSatish Balay     const char *names[6] = {"_hypre_csr_da", "_hypre_csr_oa", "_hypre_csr_dii", "_hypre_csr_djj", "_hypre_csr_oii", "_hypre_csr_ojj"};
6332cf14000SStefano Zampini     nh                   = sameint ? 6 : 2;
6342cf14000SStefano Zampini     for (i = 0; i < nh; i++) {
635225daaf8SStefano Zampini       PetscContainer c;
636225daaf8SStefano Zampini 
6379566063dSJacob Faibussowitsch       PetscCall(PetscContainerCreate(comm, &c));
6389566063dSJacob Faibussowitsch       PetscCall(PetscContainerSetPointer(c, ptrs[i]));
6399566063dSJacob Faibussowitsch       PetscCall(PetscContainerSetUserDestroy(c, hypre_array_destroy));
6409566063dSJacob Faibussowitsch       PetscCall(PetscObjectCompose((PetscObject)(*B), names[i], (PetscObject)c));
6419566063dSJacob Faibussowitsch       PetscCall(PetscContainerDestroy(&c));
642225daaf8SStefano Zampini     }
64363c07aadSStefano Zampini   }
64463c07aadSStefano Zampini   PetscFunctionReturn(0);
64563c07aadSStefano Zampini }
64663c07aadSStefano Zampini 
/*
  MatAIJGetParCSR_Private - wraps the CSR arrays of an AIJ matrix in a temporary hypre_ParCSRMatrix.

  A  - input matrix; its base type must be MATMPIAIJ or MATSEQAIJ, anything else errors with PETSC_ERR_SUP
  hA - on return, the temporary ParCSR

  The numerical values (diag->a, offd->a) and the off-diagonal column map (garray) are borrowed, not
  copied, and both CSR parts are flagged as not owning their data. The row-offset/column-index arrays
  are either borrowed (when PetscInt and HYPRE_Int have the same size, or when they are obtained from
  MatSeqAIJCUSPARSEGetIJ) or allocated here with PetscMalloc2 as HYPRE_Int copies.

  NOTE(review): the wrapper is presumably meant to be released with MatAIJRestoreParCSR_Private();
  the callers in this file do so.
*/
647d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA)
648d71ae5a4SJacob Faibussowitsch {
649613e5ff0Sstefano_zampini   hypre_ParCSRMatrix *tA;
650c1a070e6SStefano Zampini   hypre_CSRMatrix    *hdiag, *hoffd;
651c1a070e6SStefano Zampini   Mat_SeqAIJ         *diag, *offd;
6522cf14000SStefano Zampini   PetscInt           *garray, i, noffd, dnnz, onnz, *row_starts, *col_starts;
653c1a070e6SStefano Zampini   MPI_Comm            comm = PetscObjectComm((PetscObject)A);
654613e5ff0Sstefano_zampini   PetscBool           ismpiaij, isseqaij;
/* sameint: PETSc and hypre index types have the same size, so index arrays can be aliased instead of copied */
6552cf14000SStefano Zampini   PetscBool           sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
/* h* are the index arrays handed to hypre, p* the PETSc host index arrays (d = diagonal block, o = off-diagonal block) */
6566ea7df73SStefano Zampini   HYPRE_Int          *hdi = NULL, *hdj = NULL, *hoi = NULL, *hoj = NULL;
6575c97c10fSStefano Zampini   PetscInt           *pdi = NULL, *pdj = NULL, *poi = NULL, *poj = NULL;
6586ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
6596ea7df73SStefano Zampini   PetscBool iscuda = PETSC_FALSE;
6606ea7df73SStefano Zampini #endif
661c1a070e6SStefano Zampini 
662c1a070e6SStefano Zampini   PetscFunctionBegin;
6639566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij));
6649566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &isseqaij));
66508401ef6SPierre Jolivet   PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Unsupported type %s", ((PetscObject)A)->type_name);
666c1a070e6SStefano Zampini   if (ismpiaij) {
667c1a070e6SStefano Zampini     Mat_MPIAIJ *a = (Mat_MPIAIJ *)(A->data);
668c1a070e6SStefano Zampini 
669c1a070e6SStefano Zampini     diag = (Mat_SeqAIJ *)a->A->data;
670c1a070e6SStefano Zampini     offd = (Mat_SeqAIJ *)a->B->data;
/* The index arrays from MatSeqAIJCUSPARSEGetIJ are used only for a CUSPARSE matrix that is not bound to the CPU.
   The preprocessor branches below share the closing brace of the host-array block. */
6716ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) && defined(HYPRE_USING_CUDA)
6729566063dSJacob Faibussowitsch     PetscCall(PetscObjectTypeCompare((PetscObject)A, MATMPIAIJCUSPARSE, &iscuda));
6736ea7df73SStefano Zampini     if (iscuda && !A->boundtocpu) {
6746ea7df73SStefano Zampini       sameint = PETSC_TRUE;
6759566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJCUSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
6769566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJCUSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj));
6776ea7df73SStefano Zampini     } else {
6786ea7df73SStefano Zampini #else
6796ea7df73SStefano Zampini     {
6806ea7df73SStefano Zampini #endif
6816ea7df73SStefano Zampini       pdi = diag->i;
6826ea7df73SStefano Zampini       pdj = diag->j;
6836ea7df73SStefano Zampini       poi = offd->i;
6846ea7df73SStefano Zampini       poj = offd->j;
6856ea7df73SStefano Zampini       if (sameint) {
6866ea7df73SStefano Zampini         hdi = (HYPRE_Int *)pdi;
6876ea7df73SStefano Zampini         hdj = (HYPRE_Int *)pdj;
6886ea7df73SStefano Zampini         hoi = (HYPRE_Int *)poi;
6896ea7df73SStefano Zampini         hoj = (HYPRE_Int *)poj;
6906ea7df73SStefano Zampini       }
6916ea7df73SStefano Zampini     }
692c1a070e6SStefano Zampini     garray = a->garray;
693c1a070e6SStefano Zampini     noffd  = a->B->cmap->N;
694c1a070e6SStefano Zampini     dnnz   = diag->nz;
695c1a070e6SStefano Zampini     onnz   = offd->nz;
696c1a070e6SStefano Zampini   } else {
/* sequential matrix: there is no off-diagonal block and no column map */
697c1a070e6SStefano Zampini     diag = (Mat_SeqAIJ *)A->data;
698c1a070e6SStefano Zampini     offd = NULL;
6996ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE)
7009566063dSJacob Faibussowitsch     PetscCall(PetscObjectTypeCompare((PetscObject)A, MATSEQAIJCUSPARSE, &iscuda));
7016ea7df73SStefano Zampini     if (iscuda && !A->boundtocpu) {
7026ea7df73SStefano Zampini       sameint = PETSC_TRUE;
7039566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJCUSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
7046ea7df73SStefano Zampini     } else {
7056ea7df73SStefano Zampini #else
7066ea7df73SStefano Zampini     {
7076ea7df73SStefano Zampini #endif
7086ea7df73SStefano Zampini       pdi = diag->i;
7096ea7df73SStefano Zampini       pdj = diag->j;
7106ea7df73SStefano Zampini       if (sameint) {
7116ea7df73SStefano Zampini         hdi = (HYPRE_Int *)pdi;
7126ea7df73SStefano Zampini         hdj = (HYPRE_Int *)pdj;
7136ea7df73SStefano Zampini       }
7146ea7df73SStefano Zampini     }
715c1a070e6SStefano Zampini     garray = NULL;
716c1a070e6SStefano Zampini     noffd  = 0;
717c1a070e6SStefano Zampini     dnnz   = diag->nz;
718c1a070e6SStefano Zampini     onnz   = 0;
719c1a070e6SStefano Zampini   }
720225daaf8SStefano Zampini 
721c1a070e6SStefano Zampini   /* create a temporary ParCSR */
/* when HYPRE_AssumedPartitionCheck() is nonzero the starts pointers are offset to this rank's entry
   of the layout ranges; otherwise they point at the beginning of the range arrays */
722c1a070e6SStefano Zampini   if (HYPRE_AssumedPartitionCheck()) {
723c1a070e6SStefano Zampini     PetscMPIInt myid;
724c1a070e6SStefano Zampini 
7259566063dSJacob Faibussowitsch     PetscCallMPI(MPI_Comm_rank(comm, &myid));
726c1a070e6SStefano Zampini     row_starts = A->rmap->range + myid;
727c1a070e6SStefano Zampini     col_starts = A->cmap->range + myid;
728c1a070e6SStefano Zampini   } else {
729c1a070e6SStefano Zampini     row_starts = A->rmap->range;
730c1a070e6SStefano Zampini     col_starts = A->cmap->range;
731c1a070e6SStefano Zampini   }
7322cf14000SStefano Zampini   tA = hypre_ParCSRMatrixCreate(comm, A->rmap->N, A->cmap->N, (HYPRE_BigInt *)row_starts, (HYPRE_BigInt *)col_starts, noffd, dnnz, onnz);
/* the starts arrays belong to A's layouts, so tA is told not to own them (only where hypre exposes the ownership flag) */
733a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
734c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetRowStartsOwner(tA, 0);
735c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetColStartsOwner(tA, 0);
736a1d2239cSSatish Balay #endif
737c1a070e6SStefano Zampini 
738225daaf8SStefano Zampini   /* set diagonal part */
739c1a070e6SStefano Zampini   hdiag = hypre_ParCSRMatrixDiag(tA);
/* index sizes differ: build HYPRE_Int copies of the PETSc row offsets and column indices */
7406ea7df73SStefano Zampini   if (!sameint) { /* malloc CSR pointers */
7419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(A->rmap->n + 1, &hdi, dnnz, &hdj));
7426ea7df73SStefano Zampini     for (i = 0; i < A->rmap->n + 1; i++) hdi[i] = (HYPRE_Int)(pdi[i]);
7436ea7df73SStefano Zampini     for (i = 0; i < dnnz; i++) hdj[i] = (HYPRE_Int)(pdj[i]);
7442cf14000SStefano Zampini   }
7456ea7df73SStefano Zampini   hypre_CSRMatrixI(hdiag)           = hdi;
7466ea7df73SStefano Zampini   hypre_CSRMatrixJ(hdiag)           = hdj;
74739accc25SStefano Zampini   hypre_CSRMatrixData(hdiag)        = (HYPRE_Complex *)diag->a;
748c1a070e6SStefano Zampini   hypre_CSRMatrixNumNonzeros(hdiag) = diag->nz;
749c1a070e6SStefano Zampini   hypre_CSRMatrixSetRownnz(hdiag);
750c1a070e6SStefano Zampini   hypre_CSRMatrixSetDataOwner(hdiag, 0);
751c1a070e6SStefano Zampini 
752225daaf8SStefano Zampini   /* set offdiagonal part */
753c1a070e6SStefano Zampini   hoffd = hypre_ParCSRMatrixOffd(tA);
/* offd is NULL for a sequential matrix, in which case the off-diagonal CSR of tA is left as created */
754c1a070e6SStefano Zampini   if (offd) {
7556ea7df73SStefano Zampini     if (!sameint) { /* malloc CSR pointers */
7569566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(A->rmap->n + 1, &hoi, onnz, &hoj));
7576ea7df73SStefano Zampini       for (i = 0; i < A->rmap->n + 1; i++) hoi[i] = (HYPRE_Int)(poi[i]);
7586ea7df73SStefano Zampini       for (i = 0; i < onnz; i++) hoj[i] = (HYPRE_Int)(poj[i]);
7592cf14000SStefano Zampini     }
7606ea7df73SStefano Zampini     hypre_CSRMatrixI(hoffd)           = hoi;
7616ea7df73SStefano Zampini     hypre_CSRMatrixJ(hoffd)           = hoj;
76239accc25SStefano Zampini     hypre_CSRMatrixData(hoffd)        = (HYPRE_Complex *)offd->a;
763c1a070e6SStefano Zampini     hypre_CSRMatrixNumNonzeros(hoffd) = offd->nz;
764c1a070e6SStefano Zampini     hypre_CSRMatrixSetRownnz(hoffd);
765c1a070e6SStefano Zampini     hypre_CSRMatrixSetDataOwner(hoffd, 0);
7666ea7df73SStefano Zampini   }
/* the memory location passed to hypre follows iscuda in device builds and is the host otherwise */
7676ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
768792fecdfSBarry Smith   PetscCallExternal(hypre_ParCSRMatrixInitialize_v2, tA, iscuda ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST);
7696ea7df73SStefano Zampini #else
7706ea7df73SStefano Zampini   #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
771792fecdfSBarry Smith   PetscCallExternal(hypre_ParCSRMatrixInitialize, tA);
7726ea7df73SStefano Zampini   #else
773792fecdfSBarry Smith   PetscCallExternal(hypre_ParCSRMatrixInitialize_v2, tA, HYPRE_MEMORY_HOST);
7746ea7df73SStefano Zampini   #endif
7756ea7df73SStefano Zampini #endif
/* free the column map currently held by tA (presumably allocated by the Initialize call above - TODO confirm)
   and install PETSc's garray in its place below */
7766ea7df73SStefano Zampini   hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA), HYPRE_MEMORY_HOST);
777c1a070e6SStefano Zampini   hypre_ParCSRMatrixSetNumNonzeros(tA);
7782cf14000SStefano Zampini   hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt *)garray;
/* build the matvec communication package only if tA does not have one yet */
779792fecdfSBarry Smith   if (!hypre_ParCSRMatrixCommPkg(tA)) PetscCallExternal(hypre_MatvecCommPkgCreate, tA);
780613e5ff0Sstefano_zampini   *hA = tA;
781613e5ff0Sstefano_zampini   PetscFunctionReturn(0);
782613e5ff0Sstefano_zampini }
783c1a070e6SStefano Zampini 
784d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA)
785d71ae5a4SJacob Faibussowitsch {
786613e5ff0Sstefano_zampini   hypre_CSRMatrix *hdiag, *hoffd;
7876ea7df73SStefano Zampini   PetscBool        ismpiaij, sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
7886ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
7896ea7df73SStefano Zampini   PetscBool iscuda = PETSC_FALSE;
7906ea7df73SStefano Zampini #endif
791c1a070e6SStefano Zampini 
792613e5ff0Sstefano_zampini   PetscFunctionBegin;
7939566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij));
7946ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
7959566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, ""));
7966ea7df73SStefano Zampini   if (iscuda) sameint = PETSC_TRUE;
7976ea7df73SStefano Zampini #endif
798613e5ff0Sstefano_zampini   hdiag = hypre_ParCSRMatrixDiag(*hA);
799613e5ff0Sstefano_zampini   hoffd = hypre_ParCSRMatrixOffd(*hA);
8006ea7df73SStefano Zampini   /* free temporary memory allocated by PETSc
8016ea7df73SStefano Zampini      set pointers to NULL before destroying tA */
8022cf14000SStefano Zampini   if (!sameint) {
8032cf14000SStefano Zampini     HYPRE_Int *hi, *hj;
8042cf14000SStefano Zampini 
8052cf14000SStefano Zampini     hi = hypre_CSRMatrixI(hdiag);
8062cf14000SStefano Zampini     hj = hypre_CSRMatrixJ(hdiag);
8079566063dSJacob Faibussowitsch     PetscCall(PetscFree2(hi, hj));
8086ea7df73SStefano Zampini     if (ismpiaij) {
8092cf14000SStefano Zampini       hi = hypre_CSRMatrixI(hoffd);
8102cf14000SStefano Zampini       hj = hypre_CSRMatrixJ(hoffd);
8119566063dSJacob Faibussowitsch       PetscCall(PetscFree2(hi, hj));
8122cf14000SStefano Zampini     }
8132cf14000SStefano Zampini   }
814c1a070e6SStefano Zampini   hypre_CSRMatrixI(hdiag)    = NULL;
815c1a070e6SStefano Zampini   hypre_CSRMatrixJ(hdiag)    = NULL;
816c1a070e6SStefano Zampini   hypre_CSRMatrixData(hdiag) = NULL;
8176ea7df73SStefano Zampini   if (ismpiaij) {
818c1a070e6SStefano Zampini     hypre_CSRMatrixI(hoffd)    = NULL;
819c1a070e6SStefano Zampini     hypre_CSRMatrixJ(hoffd)    = NULL;
820c1a070e6SStefano Zampini     hypre_CSRMatrixData(hoffd) = NULL;
8216ea7df73SStefano Zampini   }
822613e5ff0Sstefano_zampini   hypre_ParCSRMatrixColMapOffd(*hA) = NULL;
823613e5ff0Sstefano_zampini   hypre_ParCSRMatrixDestroy(*hA);
824613e5ff0Sstefano_zampini   *hA = NULL;
825613e5ff0Sstefano_zampini   PetscFunctionReturn(0);
826613e5ff0Sstefano_zampini }
827613e5ff0Sstefano_zampini 
828613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG:
8293dad0653Sstefano_zampini    the resulting ParCSR will not own the column and row starts
8306ea7df73SStefano Zampini    It looks like we don't need to have the diagonal entries ordered first */
831d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP)
832d71ae5a4SJacob Faibussowitsch {
833a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
834613e5ff0Sstefano_zampini   HYPRE_Int P_owns_col_starts, R_owns_row_starts;
835a1d2239cSSatish Balay #endif
836613e5ff0Sstefano_zampini 
837613e5ff0Sstefano_zampini   PetscFunctionBegin;
838a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
839613e5ff0Sstefano_zampini   P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP);
840613e5ff0Sstefano_zampini   R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR);
841a1d2239cSSatish Balay #endif
8426ea7df73SStefano Zampini   /* can be replaced by version test later */
8436ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
844792fecdfSBarry Smith   PetscStackPushExternal("hypre_ParCSRMatrixRAP");
8456ea7df73SStefano Zampini   *hRAP = hypre_ParCSRMatrixRAP(hR, hA, hP);
8466ea7df73SStefano Zampini   PetscStackPop;
8476ea7df73SStefano Zampini #else
848792fecdfSBarry Smith   PetscCallExternal(hypre_BoomerAMGBuildCoarseOperator, hR, hA, hP, hRAP);
849792fecdfSBarry Smith   PetscCallExternal(hypre_ParCSRMatrixSetNumNonzeros, *hRAP);
8506ea7df73SStefano Zampini #endif
851613e5ff0Sstefano_zampini   /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */
852a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
853613e5ff0Sstefano_zampini   hypre_ParCSRMatrixSetRowStartsOwner(*hRAP, 0);
854613e5ff0Sstefano_zampini   hypre_ParCSRMatrixSetColStartsOwner(*hRAP, 0);
855613e5ff0Sstefano_zampini   if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP, 1);
856613e5ff0Sstefano_zampini   if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR, 1);
857a1d2239cSSatish Balay #endif
858613e5ff0Sstefano_zampini   PetscFunctionReturn(0);
859613e5ff0Sstefano_zampini }
860613e5ff0Sstefano_zampini 
861d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat P, Mat C)
862d71ae5a4SJacob Faibussowitsch {
8636f231fbdSstefano_zampini   Mat                 B;
8646abb4441SStefano Zampini   hypre_ParCSRMatrix *hA, *hP, *hPtAP = NULL;
8654222ddf1SHong Zhang   Mat_Product        *product = C->product;
866613e5ff0Sstefano_zampini 
867613e5ff0Sstefano_zampini   PetscFunctionBegin;
8689566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A, &hA));
8699566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(P, &hP));
8709566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(hP, hA, hP, &hPtAP));
8719566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hPtAP, MATAIJ, PETSC_OWN_POINTER, &B));
8724222ddf1SHong Zhang 
8739566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C, &B));
8744222ddf1SHong Zhang   C->product = product;
8754222ddf1SHong Zhang 
8769566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
8779566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(P, &hP));
8786f231fbdSstefano_zampini   PetscFunctionReturn(0);
8796f231fbdSstefano_zampini }
8806f231fbdSstefano_zampini 
881d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat P, PetscReal fill, Mat C)
882d71ae5a4SJacob Faibussowitsch {
8836f231fbdSstefano_zampini   PetscFunctionBegin;
8849566063dSJacob Faibussowitsch   PetscCall(MatSetType(C, MATAIJ));
8854222ddf1SHong Zhang   C->ops->ptapnumeric    = MatPtAPNumeric_AIJ_AIJ_wHYPRE;
8864222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_PtAP;
887613e5ff0Sstefano_zampini   PetscFunctionReturn(0);
888613e5ff0Sstefano_zampini }
889613e5ff0Sstefano_zampini 
890d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A, Mat P, Mat C)
891d71ae5a4SJacob Faibussowitsch {
8924cc28894Sstefano_zampini   Mat                 B;
8934cc28894Sstefano_zampini   Mat_HYPRE          *hP;
8946abb4441SStefano Zampini   hypre_ParCSRMatrix *hA = NULL, *Pparcsr, *ptapparcsr = NULL;
895613e5ff0Sstefano_zampini   HYPRE_Int           type;
896613e5ff0Sstefano_zampini   MPI_Comm            comm = PetscObjectComm((PetscObject)A);
8974cc28894Sstefano_zampini   PetscBool           ishypre;
898613e5ff0Sstefano_zampini 
899613e5ff0Sstefano_zampini   PetscFunctionBegin;
9009566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre));
90128b400f6SJacob Faibussowitsch   PetscCheck(ishypre, comm, PETSC_ERR_USER, "P should be of type %s", MATHYPRE);
9024cc28894Sstefano_zampini   hP = (Mat_HYPRE *)P->data;
903792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, hP->ij, &type);
90408401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
905792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hP->ij, (void **)&Pparcsr);
906613e5ff0Sstefano_zampini 
9079566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A, &hA));
9089566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, hA, Pparcsr, &ptapparcsr));
9099566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
910225daaf8SStefano Zampini 
9114cc28894Sstefano_zampini   /* create temporary matrix and merge to C */
9129566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ptapparcsr, ((PetscObject)C)->type_name, PETSC_OWN_POINTER, &B));
9139566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C, &B));
9144cc28894Sstefano_zampini   PetscFunctionReturn(0);
9154cc28894Sstefano_zampini }
9164cc28894Sstefano_zampini 
917d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A, Mat P, Mat C)
918d71ae5a4SJacob Faibussowitsch {
9194cc28894Sstefano_zampini   Mat                 B;
9206abb4441SStefano Zampini   hypre_ParCSRMatrix *Aparcsr, *Pparcsr, *ptapparcsr = NULL;
9214cc28894Sstefano_zampini   Mat_HYPRE          *hA, *hP;
9224cc28894Sstefano_zampini   PetscBool           ishypre;
9234cc28894Sstefano_zampini   HYPRE_Int           type;
9244cc28894Sstefano_zampini 
9254cc28894Sstefano_zampini   PetscFunctionBegin;
9269566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre));
92728b400f6SJacob Faibussowitsch   PetscCheck(ishypre, PetscObjectComm((PetscObject)P), PETSC_ERR_USER, "P should be of type %s", MATHYPRE);
9289566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre));
92928b400f6SJacob Faibussowitsch   PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE);
9304cc28894Sstefano_zampini   hA = (Mat_HYPRE *)A->data;
9314cc28894Sstefano_zampini   hP = (Mat_HYPRE *)P->data;
932792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type);
93308401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
934792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, hP->ij, &type);
93508401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)P), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
936792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&Aparcsr);
937792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hP->ij, (void **)&Pparcsr);
9389566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, Aparcsr, Pparcsr, &ptapparcsr));
9399566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ptapparcsr, MATHYPRE, PETSC_OWN_POINTER, &B));
9409566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C, &B));
9414cc28894Sstefano_zampini   PetscFunctionReturn(0);
9424cc28894Sstefano_zampini }
9434cc28894Sstefano_zampini 
944d501dc42Sstefano_zampini /* calls hypre_ParMatmul
945d501dc42Sstefano_zampini    hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA
9463dad0653Sstefano_zampini    hypre_ParMatrixCreate does not duplicate the communicator
9476ea7df73SStefano Zampini    It looks like we don't need to have the diagonal entries ordered first */
948d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB)
949d71ae5a4SJacob Faibussowitsch {
950d501dc42Sstefano_zampini   PetscFunctionBegin;
9516ea7df73SStefano Zampini   /* can be replaced by version test later */
9526ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
953792fecdfSBarry Smith   PetscStackPushExternal("hypre_ParCSRMatMat");
9546ea7df73SStefano Zampini   *hAB = hypre_ParCSRMatMat(hA, hB);
9556ea7df73SStefano Zampini #else
956792fecdfSBarry Smith   PetscStackPushExternal("hypre_ParMatmul");
957d501dc42Sstefano_zampini   *hAB = hypre_ParMatmul(hA, hB);
9586ea7df73SStefano Zampini #endif
959d501dc42Sstefano_zampini   PetscStackPop;
960d501dc42Sstefano_zampini   PetscFunctionReturn(0);
961d501dc42Sstefano_zampini }
962d501dc42Sstefano_zampini 
963d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C)
964d71ae5a4SJacob Faibussowitsch {
9655e5acdf2Sstefano_zampini   Mat                 D;
966d501dc42Sstefano_zampini   hypre_ParCSRMatrix *hA, *hB, *hAB = NULL;
9674222ddf1SHong Zhang   Mat_Product        *product = C->product;
9685e5acdf2Sstefano_zampini 
9695e5acdf2Sstefano_zampini   PetscFunctionBegin;
9709566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A, &hA));
9719566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(B, &hB));
9729566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_MatMatMult(hA, hB, &hAB));
9739566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hAB, MATAIJ, PETSC_OWN_POINTER, &D));
9744222ddf1SHong Zhang 
9759566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(C, &D));
9764222ddf1SHong Zhang   C->product = product;
9774222ddf1SHong Zhang 
9789566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
9799566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(B, &hB));
9805e5acdf2Sstefano_zampini   PetscFunctionReturn(0);
9815e5acdf2Sstefano_zampini }
9825e5acdf2Sstefano_zampini 
983d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat B, PetscReal fill, Mat C)
984d71ae5a4SJacob Faibussowitsch {
9855e5acdf2Sstefano_zampini   PetscFunctionBegin;
9869566063dSJacob Faibussowitsch   PetscCall(MatSetType(C, MATAIJ));
9874222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE;
9884222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
9895e5acdf2Sstefano_zampini   PetscFunctionReturn(0);
9905e5acdf2Sstefano_zampini }
9915e5acdf2Sstefano_zampini 
992d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A, Mat B, Mat C)
993d71ae5a4SJacob Faibussowitsch {
994d501dc42Sstefano_zampini   Mat                 D;
995d501dc42Sstefano_zampini   hypre_ParCSRMatrix *Aparcsr, *Bparcsr, *ABparcsr = NULL;
996d501dc42Sstefano_zampini   Mat_HYPRE          *hA, *hB;
997d501dc42Sstefano_zampini   PetscBool           ishypre;
998d501dc42Sstefano_zampini   HYPRE_Int           type;
9994222ddf1SHong Zhang   Mat_Product        *product;
1000d501dc42Sstefano_zampini 
1001d501dc42Sstefano_zampini   PetscFunctionBegin;
10029566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHYPRE, &ishypre));
100328b400f6SJacob Faibussowitsch   PetscCheck(ishypre, PetscObjectComm((PetscObject)B), PETSC_ERR_USER, "B should be of type %s", MATHYPRE);
10049566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre));
100528b400f6SJacob Faibussowitsch   PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE);
1006d501dc42Sstefano_zampini   hA = (Mat_HYPRE *)A->data;
1007d501dc42Sstefano_zampini   hB = (Mat_HYPRE *)B->data;
1008792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type);
100908401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1010792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, hB->ij, &type);
101108401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1012792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&Aparcsr);
1013792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hB->ij, (void **)&Bparcsr);
10149566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_MatMatMult(Aparcsr, Bparcsr, &ABparcsr));
10159566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(ABparcsr, MATHYPRE, PETSC_OWN_POINTER, &D));
10164222ddf1SHong Zhang 
1017d501dc42Sstefano_zampini   /* need to use HeaderReplace because HeaderMerge messes up with the communicator */
10184222ddf1SHong Zhang   product    = C->product; /* save it from MatHeaderReplace() */
10194222ddf1SHong Zhang   C->product = NULL;
10209566063dSJacob Faibussowitsch   PetscCall(MatHeaderReplace(C, &D));
10214222ddf1SHong Zhang   C->product             = product;
1022d501dc42Sstefano_zampini   C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE;
10234222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
1024d501dc42Sstefano_zampini   PetscFunctionReturn(0);
1025d501dc42Sstefano_zampini }
1026d501dc42Sstefano_zampini 
1027d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, Mat D)
1028d71ae5a4SJacob Faibussowitsch {
102920e1dc0dSstefano_zampini   Mat                 E;
10306abb4441SStefano Zampini   hypre_ParCSRMatrix *hA, *hB, *hC, *hABC = NULL;
103120e1dc0dSstefano_zampini 
103220e1dc0dSstefano_zampini   PetscFunctionBegin;
10339566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(A, &hA));
10349566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(B, &hB));
10359566063dSJacob Faibussowitsch   PetscCall(MatAIJGetParCSR_Private(C, &hC));
10369566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_ParCSR_RAP(hA, hB, hC, &hABC));
10379566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(hABC, MATAIJ, PETSC_OWN_POINTER, &E));
10389566063dSJacob Faibussowitsch   PetscCall(MatHeaderMerge(D, &E));
10399566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
10409566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(B, &hB));
10419566063dSJacob Faibussowitsch   PetscCall(MatAIJRestoreParCSR_Private(C, &hC));
104220e1dc0dSstefano_zampini   PetscFunctionReturn(0);
104320e1dc0dSstefano_zampini }
104420e1dc0dSstefano_zampini 
1045d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, PetscReal fill, Mat D)
1046d71ae5a4SJacob Faibussowitsch {
104720e1dc0dSstefano_zampini   PetscFunctionBegin;
10489566063dSJacob Faibussowitsch   PetscCall(MatSetType(D, MATAIJ));
104920e1dc0dSstefano_zampini   PetscFunctionReturn(0);
105020e1dc0dSstefano_zampini }
105120e1dc0dSstefano_zampini 
10524222ddf1SHong Zhang /* ---------------------------------------------------- */
1053d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C)
1054d71ae5a4SJacob Faibussowitsch {
10554222ddf1SHong Zhang   PetscFunctionBegin;
10564222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_AB;
10574222ddf1SHong Zhang   PetscFunctionReturn(0);
10584222ddf1SHong Zhang }
10594222ddf1SHong Zhang 
1060d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C)
1061d71ae5a4SJacob Faibussowitsch {
10624222ddf1SHong Zhang   Mat_Product *product = C->product;
10634222ddf1SHong Zhang   PetscBool    Ahypre;
10644222ddf1SHong Zhang 
10654222ddf1SHong Zhang   PetscFunctionBegin;
10669566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)product->A, MATHYPRE, &Ahypre));
10674222ddf1SHong Zhang   if (Ahypre) { /* A is a Hypre matrix */
10689566063dSJacob Faibussowitsch     PetscCall(MatSetType(C, MATHYPRE));
10694222ddf1SHong Zhang     C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE;
10704222ddf1SHong Zhang     C->ops->matmultnumeric  = MatMatMultNumeric_HYPRE_HYPRE;
10714222ddf1SHong Zhang     PetscFunctionReturn(0);
10726718818eSStefano Zampini   }
10734222ddf1SHong Zhang   PetscFunctionReturn(0);
10744222ddf1SHong Zhang }
10754222ddf1SHong Zhang 
1076d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C)
1077d71ae5a4SJacob Faibussowitsch {
10784222ddf1SHong Zhang   PetscFunctionBegin;
10794222ddf1SHong Zhang   C->ops->productnumeric = MatProductNumeric_PtAP;
10804222ddf1SHong Zhang   PetscFunctionReturn(0);
10814222ddf1SHong Zhang }
10824222ddf1SHong Zhang 
1083d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C)
1084d71ae5a4SJacob Faibussowitsch {
10854222ddf1SHong Zhang   Mat_Product *product = C->product;
10864222ddf1SHong Zhang   PetscBool    flg;
10874222ddf1SHong Zhang   PetscInt     type        = 0;
10884222ddf1SHong Zhang   const char  *outTypes[4] = {"aij", "seqaij", "mpiaij", "hypre"};
10894222ddf1SHong Zhang   PetscInt     ntype       = 4;
10904222ddf1SHong Zhang   Mat          A           = product->A;
10914222ddf1SHong Zhang   PetscBool    Ahypre;
10924222ddf1SHong Zhang 
10934222ddf1SHong Zhang   PetscFunctionBegin;
10949566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &Ahypre));
10954222ddf1SHong Zhang   if (Ahypre) { /* A is a Hypre matrix */
10969566063dSJacob Faibussowitsch     PetscCall(MatSetType(C, MATHYPRE));
10974222ddf1SHong Zhang     C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE;
10984222ddf1SHong Zhang     C->ops->ptapnumeric     = MatPtAPNumeric_HYPRE_HYPRE;
10994222ddf1SHong Zhang     PetscFunctionReturn(0);
11004222ddf1SHong Zhang   }
11014222ddf1SHong Zhang 
11024222ddf1SHong Zhang   /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */
11034222ddf1SHong Zhang   /* Get runtime option */
11044222ddf1SHong Zhang   if (product->api_user) {
1105d0609cedSBarry Smith     PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatPtAP_HYPRE", "Mat");
11069566063dSJacob Faibussowitsch     PetscCall(PetscOptionsEList("-matptap_hypre_outtype", "MatPtAP outtype", "MatPtAP outtype", outTypes, ntype, outTypes[type], &type, &flg));
1107d0609cedSBarry Smith     PetscOptionsEnd();
11084222ddf1SHong Zhang   } else {
1109d0609cedSBarry Smith     PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatProduct_PtAP_HYPRE", "Mat");
11109566063dSJacob Faibussowitsch     PetscCall(PetscOptionsEList("-mat_product_algorithm_hypre_outtype", "MatProduct_PtAP outtype", "MatProduct_PtAP", outTypes, ntype, outTypes[type], &type, &flg));
1111d0609cedSBarry Smith     PetscOptionsEnd();
11124222ddf1SHong Zhang   }
11134222ddf1SHong Zhang 
11144222ddf1SHong Zhang   if (type == 0 || type == 1 || type == 2) {
11159566063dSJacob Faibussowitsch     PetscCall(MatSetType(C, MATAIJ));
11164222ddf1SHong Zhang   } else if (type == 3) {
11179566063dSJacob Faibussowitsch     PetscCall(MatSetType(C, MATHYPRE));
11184222ddf1SHong Zhang   } else SETERRQ(PetscObjectComm((PetscObject)C), PETSC_ERR_SUP, "MatPtAP outtype is not supported");
11194222ddf1SHong Zhang   C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE;
11204222ddf1SHong Zhang   C->ops->ptapnumeric     = MatPtAPNumeric_AIJ_HYPRE;
11214222ddf1SHong Zhang   PetscFunctionReturn(0);
11224222ddf1SHong Zhang }
11234222ddf1SHong Zhang 
1124d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C)
1125d71ae5a4SJacob Faibussowitsch {
11264222ddf1SHong Zhang   Mat_Product *product = C->product;
11274222ddf1SHong Zhang 
11284222ddf1SHong Zhang   PetscFunctionBegin;
11294222ddf1SHong Zhang   switch (product->type) {
1130d71ae5a4SJacob Faibussowitsch   case MATPRODUCT_AB:
1131d71ae5a4SJacob Faibussowitsch     PetscCall(MatProductSetFromOptions_HYPRE_AB(C));
1132d71ae5a4SJacob Faibussowitsch     break;
1133d71ae5a4SJacob Faibussowitsch   case MATPRODUCT_PtAP:
1134d71ae5a4SJacob Faibussowitsch     PetscCall(MatProductSetFromOptions_HYPRE_PtAP(C));
1135d71ae5a4SJacob Faibussowitsch     break;
1136d71ae5a4SJacob Faibussowitsch   default:
1137d71ae5a4SJacob Faibussowitsch     break;
11384222ddf1SHong Zhang   }
11394222ddf1SHong Zhang   PetscFunctionReturn(0);
11404222ddf1SHong Zhang }
11414222ddf1SHong Zhang 
11424222ddf1SHong Zhang /* -------------------------------------------------------- */
11434222ddf1SHong Zhang 
1144d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y)
1145d71ae5a4SJacob Faibussowitsch {
114663c07aadSStefano Zampini   PetscFunctionBegin;
11479566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_TRUE));
114863c07aadSStefano Zampini   PetscFunctionReturn(0);
114963c07aadSStefano Zampini }
115063c07aadSStefano Zampini 
1151d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y)
1152d71ae5a4SJacob Faibussowitsch {
115363c07aadSStefano Zampini   PetscFunctionBegin;
11549566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_FALSE));
115563c07aadSStefano Zampini   PetscFunctionReturn(0);
115663c07aadSStefano Zampini }
115763c07aadSStefano Zampini 
1158d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z)
1159d71ae5a4SJacob Faibussowitsch {
1160414bd5c3SStefano Zampini   PetscFunctionBegin;
116148a46eb9SPierre Jolivet   if (y != z) PetscCall(VecCopy(y, z));
11629566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_FALSE));
1163414bd5c3SStefano Zampini   PetscFunctionReturn(0);
1164414bd5c3SStefano Zampini }
1165414bd5c3SStefano Zampini 
1166d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z)
1167d71ae5a4SJacob Faibussowitsch {
1168414bd5c3SStefano Zampini   PetscFunctionBegin;
116948a46eb9SPierre Jolivet   if (y != z) PetscCall(VecCopy(y, z));
11709566063dSJacob Faibussowitsch   PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_TRUE));
1171414bd5c3SStefano Zampini   PetscFunctionReturn(0);
1172414bd5c3SStefano Zampini }
1173414bd5c3SStefano Zampini 
1174414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */
1175d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans)
1176d71ae5a4SJacob Faibussowitsch {
117763c07aadSStefano Zampini   Mat_HYPRE          *hA = (Mat_HYPRE *)A->data;
117863c07aadSStefano Zampini   hypre_ParCSRMatrix *parcsr;
117963c07aadSStefano Zampini   hypre_ParVector    *hx, *hy;
118063c07aadSStefano Zampini 
118163c07aadSStefano Zampini   PetscFunctionBegin;
118263c07aadSStefano Zampini   if (trans) {
11839566063dSJacob Faibussowitsch     PetscCall(VecHYPRE_IJVectorPushVecRead(hA->b, x));
11849566063dSJacob Faibussowitsch     if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->x, y));
11859566063dSJacob Faibussowitsch     else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->x, y));
1186792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJVectorGetObject, hA->b->ij, (void **)&hx);
1187792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJVectorGetObject, hA->x->ij, (void **)&hy);
118863c07aadSStefano Zampini   } else {
11899566063dSJacob Faibussowitsch     PetscCall(VecHYPRE_IJVectorPushVecRead(hA->x, x));
11909566063dSJacob Faibussowitsch     if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->b, y));
11919566063dSJacob Faibussowitsch     else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->b, y));
1192792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJVectorGetObject, hA->x->ij, (void **)&hx);
1193792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJVectorGetObject, hA->b->ij, (void **)&hy);
119463c07aadSStefano Zampini   }
1195792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr);
11966ea7df73SStefano Zampini   if (trans) {
1197792fecdfSBarry Smith     PetscCallExternal(hypre_ParCSRMatrixMatvecT, a, parcsr, hx, b, hy);
11986ea7df73SStefano Zampini   } else {
1199792fecdfSBarry Smith     PetscCallExternal(hypre_ParCSRMatrixMatvec, a, parcsr, hx, b, hy);
12006ea7df73SStefano Zampini   }
12019566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorPopVec(hA->x));
12029566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorPopVec(hA->b));
120363c07aadSStefano Zampini   PetscFunctionReturn(0);
120463c07aadSStefano Zampini }
120563c07aadSStefano Zampini 
1206d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDestroy_HYPRE(Mat A)
1207d71ae5a4SJacob Faibussowitsch {
120863c07aadSStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
120963c07aadSStefano Zampini 
121063c07aadSStefano Zampini   PetscFunctionBegin;
12119566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorDestroy(&hA->x));
12129566063dSJacob Faibussowitsch   PetscCall(VecHYPRE_IJVectorDestroy(&hA->b));
1213978814f1SStefano Zampini   if (hA->ij) {
1214978814f1SStefano Zampini     if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL;
1215792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixDestroy, hA->ij);
1216978814f1SStefano Zampini   }
12179566063dSJacob Faibussowitsch   if (hA->comm) PetscCall(PetscCommRestoreComm(PetscObjectComm((PetscObject)A), &hA->comm));
1218c69f721fSFande Kong 
12199566063dSJacob Faibussowitsch   PetscCall(MatStashDestroy_Private(&A->stash));
12209566063dSJacob Faibussowitsch   PetscCall(PetscFree(hA->array));
1221c69f721fSFande Kong 
12225fbaff96SJunchao Zhang   if (hA->cooMat) {
12235fbaff96SJunchao Zhang     PetscCall(MatDestroy(&hA->cooMat));
1224e77caa6dSBarry Smith     PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->diagJ, hA->memType));
1225e77caa6dSBarry Smith     PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->offdJ, hA->memType));
1226e77caa6dSBarry Smith     PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->diag, hA->memType));
12275fbaff96SJunchao Zhang   }
12285fbaff96SJunchao Zhang 
12299566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_aij_C", NULL));
12309566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_is_C", NULL));
12319566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_hypre_C", NULL));
12329566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaij_hypre_C", NULL));
12339566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPRESetPreallocation_C", NULL));
12349566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPREGetParCSR_C", NULL));
12355fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12365fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
12379566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
123863c07aadSStefano Zampini   PetscFunctionReturn(0);
123963c07aadSStefano Zampini }
124063c07aadSStefano Zampini 
1241d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetUp_HYPRE(Mat A)
1242d71ae5a4SJacob Faibussowitsch {
12434ec6421dSstefano_zampini   PetscFunctionBegin;
12449566063dSJacob Faibussowitsch   PetscCall(MatHYPRESetPreallocation(A, PETSC_DEFAULT, NULL, PETSC_DEFAULT, NULL));
12454ec6421dSstefano_zampini   PetscFunctionReturn(0);
12464ec6421dSstefano_zampini }
12474ec6421dSstefano_zampini 
//TODO FIX hypre_CSRMatrixMatvecOutOfPlace
#if defined(PETSC_HAVE_HYPRE_DEVICE)
/*
   Records the binding in A->boundtocpu and moves the hypre data accordingly.

   The requested location is HYPRE_MEMORY_HOST when bind is true and
   HYPRE_MEMORY_DEVICE otherwise.  The ParCSR matrix is migrated only if the IJ matrix
   exists, its assemble flag is set, and it currently lives in a different memory
   location.  The binding is forwarded to the work vectors that exist.
*/
static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind)
{
  Mat_HYPRE           *hmat = (Mat_HYPRE *)A->data;
  HYPRE_MemoryLocation target;

  PetscFunctionBegin;
  if (bind) target = HYPRE_MEMORY_HOST;
  else target = HYPRE_MEMORY_DEVICE;

  A->boundtocpu = bind;
  if (hmat->ij && hypre_IJMatrixAssembleFlag(hmat->ij)) {
    if (target != hypre_IJMatrixMemoryLocation(hmat->ij)) {
      hypre_ParCSRMatrix *csr;

      PetscCallExternal(HYPRE_IJMatrixGetObject, hmat->ij, (void **)&csr);
      PetscCallExternal(hypre_ParCSRMatrixMigrate, csr, target);
    }
  }
  if (hmat->x) { PetscCall(VecHYPRE_IJBindToCPU(hmat->x, bind)); }
  if (hmat->b) { PetscCall(VecHYPRE_IJBindToCPU(hmat->b, bind)); }
  PetscFunctionReturn(0);
}
#endif
12676ea7df73SStefano Zampini 
/*
   Completes the assembly of a MATHYPRE matrix.

   - Errors out with PETSC_ERR_SUP for MAT_FLUSH_ASSEMBLY.
   - Unless A->nooffprocentries is set, drains the messages held by A->stash and feeds
     each run of consecutive entries sharing a row to MatSetValues_HYPRE() with
     A->insertmode.
   - Calls HYPRE_IJMatrixAssemble() and, unless hA->sorted_full is set, recreates the
     auxiliary ParCSR matrix.
   - Makes sure the ParCSR object has a communication package and that the work
     vectors hA->x (built from A->cmap) and hA->b (built from A->rmap) exist.
*/
1268d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode)
1269d71ae5a4SJacob Faibussowitsch {
127063c07aadSStefano Zampini   Mat_HYPRE   *hA = (Mat_HYPRE *)A->data;
1271c69f721fSFande Kong   PetscMPIInt  n;
1272c69f721fSFande Kong   PetscInt     i, j, rstart, ncols, flg;
1273c69f721fSFande Kong   PetscInt    *row, *col;
1274c69f721fSFande Kong   PetscScalar *val;
127563c07aadSStefano Zampini 
127663c07aadSStefano Zampini   PetscFunctionBegin;
127708401ef6SPierre Jolivet   PetscCheck(mode != MAT_FLUSH_ASSEMBLY, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE");
1278c69f721fSFande Kong 
1279c69f721fSFande Kong   if (!A->nooffprocentries) {
/* keep fetching stash messages until flg comes back as zero */
1280c69f721fSFande Kong     while (1) {
12819566063dSJacob Faibussowitsch       PetscCall(MatStashScatterGetMesg_Private(&A->stash, &n, &row, &col, &val, &flg));
1282c69f721fSFande Kong       if (!flg) break;
1283c69f721fSFande Kong 
/* i is advanced at the bottom of the body to the first entry of the next row */
1284c69f721fSFande Kong       for (i = 0; i < n;) {
1285c69f721fSFande Kong         /* Now identify the consecutive vals belonging to the same row */
1286c69f721fSFande Kong         for (j = i, rstart = row[j]; j < n; j++) {
1287c69f721fSFande Kong           if (row[j] != rstart) break;
1288c69f721fSFande Kong         }
/* when the scan above runs to the end j equals n, so both branches yield j - i */
1289c69f721fSFande Kong         if (j < n) ncols = j - i;
1290c69f721fSFande Kong         else ncols = n - i;
1291c69f721fSFande Kong         /* Now assemble all these values with a single function call */
12929566063dSJacob Faibussowitsch         PetscCall(MatSetValues_HYPRE(A, 1, row + i, ncols, col + i, val + i, A->insertmode));
1293c69f721fSFande Kong 
1294c69f721fSFande Kong         i = j;
1295c69f721fSFande Kong       }
1296c69f721fSFande Kong     }
12979566063dSJacob Faibussowitsch     PetscCall(MatStashScatterEnd_Private(&A->stash));
1298c69f721fSFande Kong   }
1299c69f721fSFande Kong 
1300792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixAssemble, hA->ij);
1301336664bdSPierre Jolivet   /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */
1302336664bdSPierre Jolivet   /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */
1303336664bdSPierre Jolivet   if (!hA->sorted_full) {
1304af1cf968SStefano Zampini     hypre_AuxParCSRMatrix *aux_matrix;
1305af1cf968SStefano Zampini 
1306af1cf968SStefano Zampini     /* call destroy just to make sure we do not leak anything */
1307af1cf968SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1308792fecdfSBarry Smith     PetscCallExternal(hypre_AuxParCSRMatrixDestroy, aux_matrix);
1309af1cf968SStefano Zampini     hypre_IJMatrixTranslator(hA->ij) = NULL;
1310af1cf968SStefano Zampini 
1311af1cf968SStefano Zampini     /* Initialize with assembled flag -> it only recreates the aux_par_matrix */
1312792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixInitialize, hA->ij);
1313af1cf968SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
13146ea7df73SStefano Zampini     if (aux_matrix) {
1315af1cf968SStefano Zampini       hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see comment in MatHYPRESetPreallocation_HYPRE */
/* the initialization routine of the aux matrix differs before and after hypre 2.19.0 */
131622235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
1317792fecdfSBarry Smith       PetscCallExternal(hypre_AuxParCSRMatrixInitialize, aux_matrix);
131822235d61SPierre Jolivet #else
1319792fecdfSBarry Smith       PetscCallExternal(hypre_AuxParCSRMatrixInitialize_v2, aux_matrix, HYPRE_MEMORY_HOST);
132022235d61SPierre Jolivet #endif
1321af1cf968SStefano Zampini     }
13226ea7df73SStefano Zampini   }
13236ea7df73SStefano Zampini   {
13246ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
13256ea7df73SStefano Zampini 
/* create the matvec communication package only if the ParCSR matrix has none yet */
1326792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr);
1327792fecdfSBarry Smith     if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscCallExternal(hypre_MatvecCommPkgCreate, parcsr);
13286ea7df73SStefano Zampini   }
/* work vectors are created once and kept for later calls */
13299566063dSJacob Faibussowitsch   if (!hA->x) PetscCall(VecHYPRE_IJVectorCreate(A->cmap, &hA->x));
13309566063dSJacob Faibussowitsch   if (!hA->b) PetscCall(VecHYPRE_IJVectorCreate(A->rmap, &hA->b));
/* device builds: apply the current value of A->boundtocpu again */
13316ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
13329566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU_HYPRE(A, A->boundtocpu));
13336ea7df73SStefano Zampini #endif
133463c07aadSStefano Zampini   PetscFunctionReturn(0);
133563c07aadSStefano Zampini }
133663c07aadSStefano Zampini 
1337d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array)
1338d71ae5a4SJacob Faibussowitsch {
1339c69f721fSFande Kong   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1340c69f721fSFande Kong 
1341c69f721fSFande Kong   PetscFunctionBegin;
134228b400f6SJacob Faibussowitsch   PetscCheck(hA->available, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Temporary space is in use");
1343c69f721fSFande Kong 
134439accc25SStefano Zampini   if (hA->size >= size) {
134539accc25SStefano Zampini     *array = hA->array;
134639accc25SStefano Zampini   } else {
13479566063dSJacob Faibussowitsch     PetscCall(PetscFree(hA->array));
1348c69f721fSFande Kong     hA->size = size;
13499566063dSJacob Faibussowitsch     PetscCall(PetscMalloc(hA->size, &hA->array));
1350c69f721fSFande Kong     *array = hA->array;
1351c69f721fSFande Kong   }
1352c69f721fSFande Kong 
1353c69f721fSFande Kong   hA->available = PETSC_FALSE;
1354c69f721fSFande Kong   PetscFunctionReturn(0);
1355c69f721fSFande Kong }
1356c69f721fSFande Kong 
1357d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array)
1358d71ae5a4SJacob Faibussowitsch {
1359c69f721fSFande Kong   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1360c69f721fSFande Kong 
1361c69f721fSFande Kong   PetscFunctionBegin;
1362c69f721fSFande Kong   *array        = NULL;
1363c69f721fSFande Kong   hA->available = PETSC_TRUE;
1364c69f721fSFande Kong   PetscFunctionReturn(0);
1365c69f721fSFande Kong }
1366c69f721fSFande Kong 
/*
   Inserts or adds an nr x nc block of values into a MATHYPRE matrix.

   Input:
     rows, cols - row and column indices; negative entries are skipped
     v          - values, read row by row with stride nc
     ins        - ADD_VALUES goes through HYPRE_IJMatrixAddToValues(); any other mode
                  is handled by the insertion branch

   The scratch space obtained from MatGetArray_HYPRE() is laid out as
     [ nc PetscInt: kept column indices | nc PetscInt: their positions in cols | HYPRE_Complex values ]
   and only the first nzc entries of each index part are filled.

   In the insertion branch, rows outside the ownership range returned by
   MatGetOwnershipRange() are placed in A->stash, the others are passed to
   HYPRE_IJMatrixSetValues().

   NOTE(review): the casts of PetscInt pointers to HYPRE_BigInt pointers presumably
   rely on both types having the same size - confirm against the build configuration.
*/
1367d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins)
1368d71ae5a4SJacob Faibussowitsch {
1369d975228cSstefano_zampini   Mat_HYPRE     *hA   = (Mat_HYPRE *)A->data;
1370d975228cSstefano_zampini   PetscScalar   *vals = (PetscScalar *)v;
137139accc25SStefano Zampini   HYPRE_Complex *sscr;
1372c69f721fSFande Kong   PetscInt      *cscr[2];
1373c69f721fSFande Kong   PetscInt       i, nzc;
137408defe43SFande Kong   void          *array = NULL;
1375d975228cSstefano_zampini 
1376d975228cSstefano_zampini   PetscFunctionBegin;
13779566063dSJacob Faibussowitsch   PetscCall(MatGetArray_HYPRE(A, sizeof(PetscInt) * (2 * nc) + sizeof(HYPRE_Complex) * nc * nr, &array));
/* carve the scratch buffer: two index arrays of length nc followed by the values */
1378c69f721fSFande Kong   cscr[0] = (PetscInt *)array;
1379c69f721fSFande Kong   cscr[1] = ((PetscInt *)array) + nc;
138039accc25SStefano Zampini   sscr    = (HYPRE_Complex *)(((PetscInt *)array) + nc * 2);
/* compact the non-negative columns: cscr[0] holds the index, cscr[1] its position in cols */
1381d975228cSstefano_zampini   for (i = 0, nzc = 0; i < nc; i++) {
1382d975228cSstefano_zampini     if (cols[i] >= 0) {
1383d975228cSstefano_zampini       cscr[0][nzc]   = cols[i];
1384d975228cSstefano_zampini       cscr[1][nzc++] = i;
1385d975228cSstefano_zampini     }
1386d975228cSstefano_zampini   }
/* nothing to do when no column survived; the scratch buffer is released first */
1387c69f721fSFande Kong   if (!nzc) {
13889566063dSJacob Faibussowitsch     PetscCall(MatRestoreArray_HYPRE(A, &array));
1389c69f721fSFande Kong     PetscFunctionReturn(0);
1390c69f721fSFande Kong   }
1391d975228cSstefano_zampini 
13926ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE)
13936ea7df73SStefano Zampini   if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) {
13946ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
13956ea7df73SStefano Zampini 
1396792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr);
1397792fecdfSBarry Smith     PetscCallExternal(hypre_ParCSRMatrixMigrate,parcsr, HYPRE_MEMORY_HOST);
13986ea7df73SStefano Zampini   }
13996ea7df73SStefano Zampini #endif
14006ea7df73SStefano Zampini 
1401d975228cSstefano_zampini   if (ins == ADD_VALUES) {
1402d975228cSstefano_zampini     for (i = 0; i < nr; i++) {
14036ea7df73SStefano Zampini       if (rows[i] >= 0) {
1404d975228cSstefano_zampini         PetscInt  j;
14052cf14000SStefano Zampini         HYPRE_Int hnc = (HYPRE_Int)nzc;
14062cf14000SStefano Zampini 
/* the round trip through HYPRE_Int detects a column count that does not fit */
1407aed4548fSBarry Smith         PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]);
/* gather the values of the kept columns of this row, converted to HYPRE_Complex */
14089566063dSJacob Faibussowitsch         for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j]));
1409792fecdfSBarry Smith         PetscCallExternal(HYPRE_IJMatrixAddToValues, hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr);
1410d975228cSstefano_zampini       }
/* advance to the next input row even when the current row was skipped */
1411d975228cSstefano_zampini       vals += nc;
1412d975228cSstefano_zampini     }
1413d975228cSstefano_zampini   } else { /* INSERT_VALUES */
1414d975228cSstefano_zampini     PetscInt rst, ren;
1415c69f721fSFande Kong 
14169566063dSJacob Faibussowitsch     PetscCall(MatGetOwnershipRange(A, &rst, &ren));
1417d975228cSstefano_zampini     for (i = 0; i < nr; i++) {
14186ea7df73SStefano Zampini       if (rows[i] >= 0) {
1419d975228cSstefano_zampini         PetscInt  j;
14202cf14000SStefano Zampini         HYPRE_Int hnc = (HYPRE_Int)nzc;
14212cf14000SStefano Zampini 
1422aed4548fSBarry Smith         PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]);
14239566063dSJacob Faibussowitsch         for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j]));
1424c69f721fSFande Kong         /* nonlocal values */
14259566063dSJacob Faibussowitsch         if (rows[i] < rst || rows[i] >= ren) PetscCall(MatStashValuesRow_Private(&A->stash, rows[i], nzc, cscr[0], (PetscScalar *)sscr, PETSC_FALSE));
1426c69f721fSFande Kong         /* local values */
1427792fecdfSBarry Smith         else PetscCallExternal(HYPRE_IJMatrixSetValues, hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr);
1428d975228cSstefano_zampini       }
1429d975228cSstefano_zampini       vals += nc;
1430d975228cSstefano_zampini     }
1431d975228cSstefano_zampini   }
1432c69f721fSFande Kong 
14339566063dSJacob Faibussowitsch   PetscCall(MatRestoreArray_HYPRE(A, &array));
1434d975228cSstefano_zampini   PetscFunctionReturn(0);
1435d975228cSstefano_zampini }
1436d975228cSstefano_zampini 
1437d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[])
1438d71ae5a4SJacob Faibussowitsch {
1439d975228cSstefano_zampini   Mat_HYPRE  *hA = (Mat_HYPRE *)A->data;
14407d968826Sstefano_zampini   HYPRE_Int  *hdnnz, *honnz;
144106a29025Sstefano_zampini   PetscInt    i, rs, re, cs, ce, bs;
1442d975228cSstefano_zampini   PetscMPIInt size;
1443d975228cSstefano_zampini 
1444d975228cSstefano_zampini   PetscFunctionBegin;
14459566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
14469566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
1447d975228cSstefano_zampini   rs = A->rmap->rstart;
1448d975228cSstefano_zampini   re = A->rmap->rend;
1449d975228cSstefano_zampini   cs = A->cmap->rstart;
1450d975228cSstefano_zampini   ce = A->cmap->rend;
1451d975228cSstefano_zampini   if (!hA->ij) {
1452792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rs, re - 1, cs, ce - 1, &hA->ij);
1453792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR);
1454d975228cSstefano_zampini   } else {
14552cf14000SStefano Zampini     HYPRE_BigInt hrs, hre, hcs, hce;
1456792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixGetLocalRange, hA->ij, &hrs, &hre, &hcs, &hce);
1457aed4548fSBarry Smith     PetscCheck(hre - hrs + 1 == re - rs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local rows: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hrs, hre + 1, rs, re);
1458aed4548fSBarry Smith     PetscCheck(hce - hcs + 1 == ce - cs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local cols: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hcs, hce + 1, cs, ce);
1459d975228cSstefano_zampini   }
14609566063dSJacob Faibussowitsch   PetscCall(MatGetBlockSize(A, &bs));
146106a29025Sstefano_zampini   if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10 * bs;
146206a29025Sstefano_zampini   if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10 * bs;
146306a29025Sstefano_zampini 
1464d975228cSstefano_zampini   if (!dnnz) {
14659566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &hdnnz));
1466d975228cSstefano_zampini     for (i = 0; i < A->rmap->n; i++) hdnnz[i] = dnz;
1467d975228cSstefano_zampini   } else {
14687d968826Sstefano_zampini     hdnnz = (HYPRE_Int *)dnnz;
1469d975228cSstefano_zampini   }
14709566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size));
1471d975228cSstefano_zampini   if (size > 1) {
1472ddbeb582SStefano Zampini     hypre_AuxParCSRMatrix *aux_matrix;
1473d975228cSstefano_zampini     if (!onnz) {
14749566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(A->rmap->n, &honnz));
1475d975228cSstefano_zampini       for (i = 0; i < A->rmap->n; i++) honnz[i] = onz;
147622235d61SPierre Jolivet     } else honnz = (HYPRE_Int *)onnz;
1477ddbeb582SStefano Zampini     /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems
1478ddbeb582SStefano Zampini        they assume the user will input the entire row values, properly sorted
1479336664bdSPierre Jolivet        In PETSc, we don't make such an assumption and set this flag to 1,
1480336664bdSPierre Jolivet        unless the option MAT_SORTED_FULL is set to true.
1481ddbeb582SStefano Zampini        Also, to avoid possible memory leaks, we destroy and recreate the translator
1482ddbeb582SStefano Zampini        This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize
1483ddbeb582SStefano Zampini        the IJ matrix for us */
1484ddbeb582SStefano Zampini     aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1485ddbeb582SStefano Zampini     hypre_AuxParCSRMatrixDestroy(aux_matrix);
1486ddbeb582SStefano Zampini     hypre_IJMatrixTranslator(hA->ij) = NULL;
1487792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, hA->ij, hdnnz, honnz);
1488ddbeb582SStefano Zampini     aux_matrix                               = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1489336664bdSPierre Jolivet     hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !hA->sorted_full;
1490d975228cSstefano_zampini   } else {
1491d975228cSstefano_zampini     honnz = NULL;
1492792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixSetRowSizes, hA->ij, hdnnz);
1493d975228cSstefano_zampini   }
1494ddbeb582SStefano Zampini 
1495af1cf968SStefano Zampini   /* reset assembled flag and call the initialize method */
1496af1cf968SStefano Zampini   hypre_IJMatrixAssembleFlag(hA->ij) = 0;
14976ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
1498792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixInitialize, hA->ij);
14996ea7df73SStefano Zampini #else
1500792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixInitialize_v2, hA->ij, HYPRE_MEMORY_HOST);
15016ea7df73SStefano Zampini #endif
150248a46eb9SPierre Jolivet   if (!dnnz) PetscCall(PetscFree(hdnnz));
150348a46eb9SPierre Jolivet   if (!onnz && honnz) PetscCall(PetscFree(honnz));
1504af1cf968SStefano Zampini   /* Match AIJ logic */
150506a29025Sstefano_zampini   A->preallocated = PETSC_TRUE;
1506af1cf968SStefano Zampini   A->assembled    = PETSC_FALSE;
1507d975228cSstefano_zampini   PetscFunctionReturn(0);
1508d975228cSstefano_zampini }
1509d975228cSstefano_zampini 
1510d975228cSstefano_zampini /*@C
1511d975228cSstefano_zampini    MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format
1512d975228cSstefano_zampini 
1513*c3339decSBarry Smith    Collective
1514d975228cSstefano_zampini 
1515d975228cSstefano_zampini    Input Parameters:
1516d975228cSstefano_zampini +  A - the matrix
1517d975228cSstefano_zampini .  dnz  - number of nonzeros per row in DIAGONAL portion of local submatrix
1518d975228cSstefano_zampini           (same value is used for all local rows)
1519d975228cSstefano_zampini .  dnnz - array containing the number of nonzeros in the various rows of the
1520d975228cSstefano_zampini           DIAGONAL portion of the local submatrix (possibly different for each row)
152111a5261eSBarry Smith           or NULL (`PETSC_NULL_INTEGER` in Fortran), if d_nz is used to specify the nonzero structure.
1522d975228cSstefano_zampini           The size of this array is equal to the number of local rows, i.e 'm'.
1523d975228cSstefano_zampini           For matrices that will be factored, you must leave room for (and set)
1524d975228cSstefano_zampini           the diagonal entry even if it is zero.
1525d975228cSstefano_zampini .  onz  - number of nonzeros per row in the OFF-DIAGONAL portion of local
1526d975228cSstefano_zampini           submatrix (same value is used for all local rows).
1527d975228cSstefano_zampini -  onnz - array containing the number of nonzeros in the various rows of the
1528d975228cSstefano_zampini           OFF-DIAGONAL portion of the local submatrix (possibly different for
152911a5261eSBarry Smith           each row) or NULL (`PETSC_NULL_INTEGER` in Fortran), if o_nz is used to specify the nonzero
1530d975228cSstefano_zampini           structure. The size of this array is equal to the number
1531d975228cSstefano_zampini           of local rows, i.e 'm'.
1532d975228cSstefano_zampini 
153311a5261eSBarry Smith    Note:
153495452b02SPatrick Sanan     If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, onz and onnz are ignored.
1535d975228cSstefano_zampini 
1536d975228cSstefano_zampini    Level: intermediate
1537d975228cSstefano_zampini 
1538db781477SPatrick Sanan .seealso: `MatCreate()`, `MatMPIAIJSetPreallocation()`, `MATHYPRE`
1539d975228cSstefano_zampini @*/
1540d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[])
1541d71ae5a4SJacob Faibussowitsch {
1542d975228cSstefano_zampini   PetscFunctionBegin;
1543d975228cSstefano_zampini   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
1544d975228cSstefano_zampini   PetscValidType(A, 1);
1545cac4c232SBarry Smith   PetscTryMethod(A, "MatHYPRESetPreallocation_C", (Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[]), (A, dnz, dnnz, onz, onnz));
1546d975228cSstefano_zampini   PetscFunctionReturn(0);
1547d975228cSstefano_zampini }
1548d975228cSstefano_zampini 
1549225daaf8SStefano Zampini /*
1550225daaf8SStefano Zampini    MatCreateFromParCSR - Creates a matrix from a hypre_ParCSRMatrix
1551225daaf8SStefano Zampini 
1552225daaf8SStefano Zampini    Collective
1553225daaf8SStefano Zampini 
1554225daaf8SStefano Zampini    Input Parameters:
155545b8d346SStefano Zampini +  parcsr   - the pointer to the hypre_ParCSRMatrix
1556bb4689ddSStefano Zampini .  mtype    - matrix type to be created. Currently MATAIJ, MATIS and MATHYPRE are supported.
1557225daaf8SStefano Zampini -  copymode - PETSc copying options
1558225daaf8SStefano Zampini 
1559225daaf8SStefano Zampini    Output Parameter:
1560225daaf8SStefano Zampini .  A  - the matrix
1561225daaf8SStefano Zampini 
1562225daaf8SStefano Zampini    Level: intermediate
1563225daaf8SStefano Zampini 
1564db781477SPatrick Sanan .seealso: `MatHYPRE`, `PetscCopyMode`
1565225daaf8SStefano Zampini */
1566d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat *A)
1567d71ae5a4SJacob Faibussowitsch {
1568225daaf8SStefano Zampini   Mat        T;
1569978814f1SStefano Zampini   Mat_HYPRE *hA;
1570978814f1SStefano Zampini   MPI_Comm   comm;
1571978814f1SStefano Zampini   PetscInt   rstart, rend, cstart, cend, M, N;
1572d248a85cSRichard Tran Mills   PetscBool  isseqaij, isseqaijmkl, ismpiaij, isaij, ishyp, isis;
1573978814f1SStefano Zampini 
1574978814f1SStefano Zampini   PetscFunctionBegin;
1575978814f1SStefano Zampini   comm = hypre_ParCSRMatrixComm(parcsr);
15769566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATSEQAIJ, &isseqaij));
15779566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATSEQAIJMKL, &isseqaijmkl));
15789566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATMPIAIJ, &ismpiaij));
15799566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij));
15809566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATHYPRE, &ishyp));
15819566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(mtype, MATIS, &isis));
1582d248a85cSRichard Tran Mills   isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij);
15836ea7df73SStefano Zampini   /* TODO */
1584aed4548fSBarry Smith   PetscCheck(isaij || ishyp || isis, comm, PETSC_ERR_SUP, "Unsupported MatType %s! Supported types are %s, %s, %s, %s, %s, and %s", mtype, MATAIJ, MATSEQAIJ, MATSEQAIJMKL, MATMPIAIJ, MATIS, MATHYPRE);
1585978814f1SStefano Zampini   /* access ParCSRMatrix */
1586978814f1SStefano Zampini   rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr);
1587978814f1SStefano Zampini   rend   = hypre_ParCSRMatrixLastRowIndex(parcsr);
1588978814f1SStefano Zampini   cstart = hypre_ParCSRMatrixFirstColDiag(parcsr);
1589978814f1SStefano Zampini   cend   = hypre_ParCSRMatrixLastColDiag(parcsr);
1590978814f1SStefano Zampini   M      = hypre_ParCSRMatrixGlobalNumRows(parcsr);
1591978814f1SStefano Zampini   N      = hypre_ParCSRMatrixGlobalNumCols(parcsr);
1592978814f1SStefano Zampini 
1593fa92c42cSstefano_zampini   /* fix for empty local rows/columns */
1594fa92c42cSstefano_zampini   if (rend < rstart) rend = rstart;
1595fa92c42cSstefano_zampini   if (cend < cstart) cend = cstart;
1596fa92c42cSstefano_zampini 
1597e6471dc9SStefano Zampini   /* PETSc convention */
1598e6471dc9SStefano Zampini   rend++;
1599e6471dc9SStefano Zampini   cend++;
1600e6471dc9SStefano Zampini   rend = PetscMin(rend, M);
1601e6471dc9SStefano Zampini   cend = PetscMin(cend, N);
1602e6471dc9SStefano Zampini 
1603978814f1SStefano Zampini   /* create PETSc matrix with MatHYPRE */
16049566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, &T));
16059566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(T, rend - rstart, cend - cstart, M, N));
16069566063dSJacob Faibussowitsch   PetscCall(MatSetType(T, MATHYPRE));
1607225daaf8SStefano Zampini   hA = (Mat_HYPRE *)(T->data);
1608978814f1SStefano Zampini 
1609978814f1SStefano Zampini   /* create HYPRE_IJMatrix */
1610792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij);
1611792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR);
161245b8d346SStefano Zampini 
16136ea7df73SStefano Zampini   // TODO DEV
161445b8d346SStefano Zampini   /* create new ParCSR object if needed */
161545b8d346SStefano Zampini   if (ishyp && copymode == PETSC_COPY_VALUES) {
161645b8d346SStefano Zampini     hypre_ParCSRMatrix *new_parcsr;
16176ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
161845b8d346SStefano Zampini     hypre_CSRMatrix *hdiag, *hoffd, *ndiag, *noffd;
161945b8d346SStefano Zampini 
16200e6427aaSSatish Balay     new_parcsr = hypre_ParCSRMatrixClone(parcsr, 0);
162145b8d346SStefano Zampini     hdiag      = hypre_ParCSRMatrixDiag(parcsr);
162245b8d346SStefano Zampini     hoffd      = hypre_ParCSRMatrixOffd(parcsr);
162345b8d346SStefano Zampini     ndiag      = hypre_ParCSRMatrixDiag(new_parcsr);
162445b8d346SStefano Zampini     noffd      = hypre_ParCSRMatrixOffd(new_parcsr);
16259566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hypre_CSRMatrixData(ndiag), hypre_CSRMatrixData(hdiag), hypre_CSRMatrixNumNonzeros(hdiag)));
16269566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(hypre_CSRMatrixData(noffd), hypre_CSRMatrixData(hoffd), hypre_CSRMatrixNumNonzeros(hoffd)));
16276ea7df73SStefano Zampini #else
16286ea7df73SStefano Zampini     new_parcsr = hypre_ParCSRMatrixClone(parcsr, 1);
16296ea7df73SStefano Zampini #endif
163045b8d346SStefano Zampini     parcsr   = new_parcsr;
163145b8d346SStefano Zampini     copymode = PETSC_OWN_POINTER;
163245b8d346SStefano Zampini   }
1633978814f1SStefano Zampini 
1634978814f1SStefano Zampini   /* set ParCSR object */
1635978814f1SStefano Zampini   hypre_IJMatrixObject(hA->ij) = parcsr;
16364ec6421dSstefano_zampini   T->preallocated              = PETSC_TRUE;
1637978814f1SStefano Zampini 
1638978814f1SStefano Zampini   /* set assembled flag */
1639978814f1SStefano Zampini   hypre_IJMatrixAssembleFlag(hA->ij) = 1;
16406ea7df73SStefano Zampini #if 0
1641792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixInitialize,hA->ij);
16426ea7df73SStefano Zampini #endif
1643225daaf8SStefano Zampini   if (ishyp) {
16446d2a658fSstefano_zampini     PetscMPIInt myid = 0;
16456d2a658fSstefano_zampini 
16466d2a658fSstefano_zampini     /* make sure we always have row_starts and col_starts available */
164748a46eb9SPierre Jolivet     if (HYPRE_AssumedPartitionCheck()) PetscCallMPI(MPI_Comm_rank(comm, &myid));
1648a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
16496d2a658fSstefano_zampini     if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) {
16506d2a658fSstefano_zampini       PetscLayout map;
16516d2a658fSstefano_zampini 
16529566063dSJacob Faibussowitsch       PetscCall(MatGetLayouts(T, NULL, &map));
16539566063dSJacob Faibussowitsch       PetscCall(PetscLayoutSetUp(map));
16542cf14000SStefano Zampini       hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid);
16556d2a658fSstefano_zampini     }
16566d2a658fSstefano_zampini     if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) {
16576d2a658fSstefano_zampini       PetscLayout map;
16586d2a658fSstefano_zampini 
16599566063dSJacob Faibussowitsch       PetscCall(MatGetLayouts(T, &map, NULL));
16609566063dSJacob Faibussowitsch       PetscCall(PetscLayoutSetUp(map));
16612cf14000SStefano Zampini       hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid);
16626d2a658fSstefano_zampini     }
1663a1d2239cSSatish Balay #endif
1664978814f1SStefano Zampini     /* prevent from freeing the pointer */
1665978814f1SStefano Zampini     if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE;
1666225daaf8SStefano Zampini     *A = T;
16679566063dSJacob Faibussowitsch     PetscCall(MatSetOption(*A, MAT_SORTED_FULL, PETSC_TRUE));
16689566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(*A, MAT_FINAL_ASSEMBLY));
16699566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(*A, MAT_FINAL_ASSEMBLY));
1670bb4689ddSStefano Zampini   } else if (isaij) {
1671bb4689ddSStefano Zampini     if (copymode != PETSC_OWN_POINTER) {
1672225daaf8SStefano Zampini       /* prevent from freeing the pointer */
1673225daaf8SStefano Zampini       hA->inner_free = PETSC_FALSE;
16749566063dSJacob Faibussowitsch       PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INITIAL_MATRIX, A));
16759566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&T));
1676225daaf8SStefano Zampini     } else { /* AIJ return type with PETSC_OWN_POINTER */
16779566063dSJacob Faibussowitsch       PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INPLACE_MATRIX, &T));
1678225daaf8SStefano Zampini       *A = T;
1679225daaf8SStefano Zampini     }
1680bb4689ddSStefano Zampini   } else if (isis) {
16819566063dSJacob Faibussowitsch     PetscCall(MatConvert_HYPRE_IS(T, MATIS, MAT_INITIAL_MATRIX, A));
16828cfe8d00SStefano Zampini     if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE;
16839566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&T));
1684bb4689ddSStefano Zampini   }
1685978814f1SStefano Zampini   PetscFunctionReturn(0);
1686978814f1SStefano Zampini }
1687978814f1SStefano Zampini 
1688d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr)
1689d71ae5a4SJacob Faibussowitsch {
1690dd9c0a25Sstefano_zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1691dd9c0a25Sstefano_zampini   HYPRE_Int  type;
1692dd9c0a25Sstefano_zampini 
1693dd9c0a25Sstefano_zampini   PetscFunctionBegin;
169428b400f6SJacob Faibussowitsch   PetscCheck(hA->ij, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE_IJMatrix not present");
1695792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type);
169608401ef6SPierre Jolivet   PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "HYPRE_IJMatrix is not of type HYPRE_PARCSR");
1697792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)parcsr);
1698dd9c0a25Sstefano_zampini   PetscFunctionReturn(0);
1699dd9c0a25Sstefano_zampini }
1700dd9c0a25Sstefano_zampini 
1701dd9c0a25Sstefano_zampini /*
1702dd9c0a25Sstefano_zampini    MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix
1703dd9c0a25Sstefano_zampini 
1704dd9c0a25Sstefano_zampini    Not collective
1705dd9c0a25Sstefano_zampini 
1706dd9c0a25Sstefano_zampini    Input Parameters:
1707dd9c0a25Sstefano_zampini +  A  - the MATHYPRE object
1708dd9c0a25Sstefano_zampini 
1709dd9c0a25Sstefano_zampini    Output Parameter:
1710dd9c0a25Sstefano_zampini .  parcsr  - the pointer to the hypre_ParCSRMatrix
1711dd9c0a25Sstefano_zampini 
1712dd9c0a25Sstefano_zampini    Level: intermediate
1713dd9c0a25Sstefano_zampini 
1714db781477SPatrick Sanan .seealso: `MatHYPRE`, `PetscCopyMode`
1715dd9c0a25Sstefano_zampini */
1716d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr)
1717d71ae5a4SJacob Faibussowitsch {
1718dd9c0a25Sstefano_zampini   PetscFunctionBegin;
1719dd9c0a25Sstefano_zampini   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
1720dd9c0a25Sstefano_zampini   PetscValidType(A, 1);
1721cac4c232SBarry Smith   PetscUseMethod(A, "MatHYPREGetParCSR_C", (Mat, hypre_ParCSRMatrix **), (A, parcsr));
1722dd9c0a25Sstefano_zampini   PetscFunctionReturn(0);
1723dd9c0a25Sstefano_zampini }
1724dd9c0a25Sstefano_zampini 
1725d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_HYPRE(Mat A, PetscBool *missing, PetscInt *dd)
1726d71ae5a4SJacob Faibussowitsch {
172768ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
172868ec7858SStefano Zampini   hypre_CSRMatrix    *ha;
172968ec7858SStefano Zampini   PetscInt            rst;
173068ec7858SStefano Zampini 
173168ec7858SStefano Zampini   PetscFunctionBegin;
173208401ef6SPierre Jolivet   PetscCheck(A->rmap->n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_SUP, "Not implemented with non-square diagonal blocks");
17339566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A, &rst, NULL));
17349566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
173568ec7858SStefano Zampini   if (missing) *missing = PETSC_FALSE;
173668ec7858SStefano Zampini   if (dd) *dd = -1;
173768ec7858SStefano Zampini   ha = hypre_ParCSRMatrixDiag(parcsr);
173868ec7858SStefano Zampini   if (ha) {
173968299464SStefano Zampini     PetscInt   size, i;
174068299464SStefano Zampini     HYPRE_Int *ii, *jj;
174168ec7858SStefano Zampini 
174268ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
174368ec7858SStefano Zampini     ii   = hypre_CSRMatrixI(ha);
174468ec7858SStefano Zampini     jj   = hypre_CSRMatrixJ(ha);
174568ec7858SStefano Zampini     for (i = 0; i < size; i++) {
174668ec7858SStefano Zampini       PetscInt  j;
174768ec7858SStefano Zampini       PetscBool found = PETSC_FALSE;
174868ec7858SStefano Zampini 
17499371c9d4SSatish Balay       for (j = ii[i]; j < ii[i + 1] && !found; j++) found = (jj[j] == i) ? PETSC_TRUE : PETSC_FALSE;
175068ec7858SStefano Zampini 
175168ec7858SStefano Zampini       if (!found) {
17527d3de750SJacob Faibussowitsch         PetscInfo(A, "Matrix is missing local diagonal entry %" PetscInt_FMT "\n", i);
175368ec7858SStefano Zampini         if (missing) *missing = PETSC_TRUE;
175468ec7858SStefano Zampini         if (dd) *dd = i + rst;
175568ec7858SStefano Zampini         PetscFunctionReturn(0);
175668ec7858SStefano Zampini       }
175768ec7858SStefano Zampini     }
175868ec7858SStefano Zampini     if (!size) {
175968ec7858SStefano Zampini       PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n");
176068ec7858SStefano Zampini       if (missing) *missing = PETSC_TRUE;
176168ec7858SStefano Zampini       if (dd) *dd = rst;
176268ec7858SStefano Zampini     }
176368ec7858SStefano Zampini   } else {
176468ec7858SStefano Zampini     PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n");
176568ec7858SStefano Zampini     if (missing) *missing = PETSC_TRUE;
176668ec7858SStefano Zampini     if (dd) *dd = rst;
176768ec7858SStefano Zampini   }
176868ec7858SStefano Zampini   PetscFunctionReturn(0);
176968ec7858SStefano Zampini }
177068ec7858SStefano Zampini 
1771d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s)
1772d71ae5a4SJacob Faibussowitsch {
177368ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
17746ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
177568ec7858SStefano Zampini   hypre_CSRMatrix *ha;
17766ea7df73SStefano Zampini #endif
177739accc25SStefano Zampini   HYPRE_Complex hs;
177868ec7858SStefano Zampini 
177968ec7858SStefano Zampini   PetscFunctionBegin;
17809566063dSJacob Faibussowitsch   PetscCall(PetscHYPREScalarCast(s, &hs));
17819566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
17826ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 19, 0)
1783792fecdfSBarry Smith   PetscCallExternal(hypre_ParCSRMatrixScale, parcsr, hs);
17846ea7df73SStefano Zampini #else /* diagonal part */
178568ec7858SStefano Zampini   ha = hypre_ParCSRMatrixDiag(parcsr);
178668ec7858SStefano Zampini   if (ha) {
178768299464SStefano Zampini     PetscInt size, i;
178868299464SStefano Zampini     HYPRE_Int *ii;
178939accc25SStefano Zampini     HYPRE_Complex *a;
179068ec7858SStefano Zampini 
179168ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
179268ec7858SStefano Zampini     a = hypre_CSRMatrixData(ha);
179368ec7858SStefano Zampini     ii = hypre_CSRMatrixI(ha);
179439accc25SStefano Zampini     for (i = 0; i < ii[size]; i++) a[i] *= hs;
179568ec7858SStefano Zampini   }
179668ec7858SStefano Zampini   /* offdiagonal part */
179768ec7858SStefano Zampini   ha = hypre_ParCSRMatrixOffd(parcsr);
179868ec7858SStefano Zampini   if (ha) {
179968299464SStefano Zampini     PetscInt size, i;
180068299464SStefano Zampini     HYPRE_Int *ii;
180139accc25SStefano Zampini     HYPRE_Complex *a;
180268ec7858SStefano Zampini 
180368ec7858SStefano Zampini     size = hypre_CSRMatrixNumRows(ha);
180468ec7858SStefano Zampini     a = hypre_CSRMatrixData(ha);
180568ec7858SStefano Zampini     ii = hypre_CSRMatrixI(ha);
180639accc25SStefano Zampini     for (i = 0; i < ii[size]; i++) a[i] *= hs;
180768ec7858SStefano Zampini   }
18086ea7df73SStefano Zampini #endif
180968ec7858SStefano Zampini   PetscFunctionReturn(0);
181068ec7858SStefano Zampini }
181168ec7858SStefano Zampini 
1812d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
1813d71ae5a4SJacob Faibussowitsch {
181468ec7858SStefano Zampini   hypre_ParCSRMatrix *parcsr;
181568299464SStefano Zampini   HYPRE_Int          *lrows;
181668299464SStefano Zampini   PetscInt            rst, ren, i;
181768ec7858SStefano Zampini 
181868ec7858SStefano Zampini   PetscFunctionBegin;
181908401ef6SPierre Jolivet   PetscCheck(!x && !b, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "To be implemented");
18209566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
18219566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(numRows, &lrows));
18229566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(A, &rst, &ren));
182368ec7858SStefano Zampini   for (i = 0; i < numRows; i++) {
18247a46b595SBarry Smith     PetscCheck(rows[i] >= rst && rows[i] < ren, PETSC_COMM_SELF, PETSC_ERR_SUP, "Non-local rows not yet supported");
182568ec7858SStefano Zampini     lrows[i] = rows[i] - rst;
182668ec7858SStefano Zampini   }
1827792fecdfSBarry Smith   PetscCallExternal(hypre_ParCSRMatrixEliminateRowsCols, parcsr, numRows, lrows);
18289566063dSJacob Faibussowitsch   PetscCall(PetscFree(lrows));
182968ec7858SStefano Zampini   PetscFunctionReturn(0);
183068ec7858SStefano Zampini }
183168ec7858SStefano Zampini 
1832d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha)
1833d71ae5a4SJacob Faibussowitsch {
1834c69f721fSFande Kong   PetscFunctionBegin;
1835c69f721fSFande Kong   if (ha) {
1836c69f721fSFande Kong     HYPRE_Int     *ii, size;
1837c69f721fSFande Kong     HYPRE_Complex *a;
1838c69f721fSFande Kong 
1839c69f721fSFande Kong     size = hypre_CSRMatrixNumRows(ha);
1840c69f721fSFande Kong     a    = hypre_CSRMatrixData(ha);
1841c69f721fSFande Kong     ii   = hypre_CSRMatrixI(ha);
1842c69f721fSFande Kong 
18439566063dSJacob Faibussowitsch     if (a) PetscCall(PetscArrayzero(a, ii[size]));
1844c69f721fSFande Kong   }
1845c69f721fSFande Kong   PetscFunctionReturn(0);
1846c69f721fSFande Kong }
1847c69f721fSFande Kong 
1848d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_HYPRE(Mat A)
1849d71ae5a4SJacob Faibussowitsch {
18506ea7df73SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
18516ea7df73SStefano Zampini 
18526ea7df73SStefano Zampini   PetscFunctionBegin;
18536ea7df73SStefano Zampini   if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) {
1854792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixSetConstantValues, hA->ij, 0.0);
18556ea7df73SStefano Zampini   } else {
1856c69f721fSFande Kong     hypre_ParCSRMatrix *parcsr;
1857c69f721fSFande Kong 
18589566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
18599566063dSJacob Faibussowitsch     PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr)));
18609566063dSJacob Faibussowitsch     PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr)));
18616ea7df73SStefano Zampini   }
1862c69f721fSFande Kong   PetscFunctionReturn(0);
1863c69f721fSFande Kong }
1864c69f721fSFande Kong 
1865d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA, PetscInt N, const PetscInt rows[], HYPRE_Complex diag)
1866d71ae5a4SJacob Faibussowitsch {
186739accc25SStefano Zampini   PetscInt       ii;
186839accc25SStefano Zampini   HYPRE_Int     *i, *j;
186939accc25SStefano Zampini   HYPRE_Complex *a;
1870c69f721fSFande Kong 
1871c69f721fSFande Kong   PetscFunctionBegin;
1872c69f721fSFande Kong   if (!hA) PetscFunctionReturn(0);
1873c69f721fSFande Kong 
187439accc25SStefano Zampini   i = hypre_CSRMatrixI(hA);
187539accc25SStefano Zampini   j = hypre_CSRMatrixJ(hA);
1876c69f721fSFande Kong   a = hypre_CSRMatrixData(hA);
1877c69f721fSFande Kong 
1878c69f721fSFande Kong   for (ii = 0; ii < N; ii++) {
187939accc25SStefano Zampini     HYPRE_Int jj, ibeg, iend, irow;
188039accc25SStefano Zampini 
1881c69f721fSFande Kong     irow = rows[ii];
1882c69f721fSFande Kong     ibeg = i[irow];
1883c69f721fSFande Kong     iend = i[irow + 1];
1884c69f721fSFande Kong     for (jj = ibeg; jj < iend; jj++)
1885c69f721fSFande Kong       if (j[jj] == irow) a[jj] = diag;
1886c69f721fSFande Kong       else a[jj] = 0.0;
1887c69f721fSFande Kong   }
1888c69f721fSFande Kong   PetscFunctionReturn(0);
1889c69f721fSFande Kong }
1890c69f721fSFande Kong 
1891d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
1892d71ae5a4SJacob Faibussowitsch {
1893c69f721fSFande Kong   hypre_ParCSRMatrix *parcsr;
1894c69f721fSFande Kong   PetscInt           *lrows, len;
189539accc25SStefano Zampini   HYPRE_Complex       hdiag;
1896c69f721fSFande Kong 
1897c69f721fSFande Kong   PetscFunctionBegin;
189808401ef6SPierre Jolivet   PetscCheck(!x && !b, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size");
18999566063dSJacob Faibussowitsch   PetscCall(PetscHYPREScalarCast(diag, &hdiag));
1900c69f721fSFande Kong   /* retrieve the internal matrix */
19019566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
1902c69f721fSFande Kong   /* get locally owned rows */
19039566063dSJacob Faibussowitsch   PetscCall(MatZeroRowsMapLocal_Private(A, N, rows, &len, &lrows));
1904c69f721fSFande Kong   /* zero diagonal part */
19059566063dSJacob Faibussowitsch   PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr), len, lrows, hdiag));
1906c69f721fSFande Kong   /* zero off-diagonal part */
19079566063dSJacob Faibussowitsch   PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr), len, lrows, 0.0));
1908c69f721fSFande Kong 
19099566063dSJacob Faibussowitsch   PetscCall(PetscFree(lrows));
1910c69f721fSFande Kong   PetscFunctionReturn(0);
1911c69f721fSFande Kong }
1912c69f721fSFande Kong 
1913d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat, MatAssemblyType mode)
1914d71ae5a4SJacob Faibussowitsch {
1915c69f721fSFande Kong   PetscFunctionBegin;
1916c69f721fSFande Kong   if (mat->nooffprocentries) PetscFunctionReturn(0);
1917c69f721fSFande Kong 
19189566063dSJacob Faibussowitsch   PetscCall(MatStashScatterBegin_Private(mat, &mat->stash, mat->rmap->range));
1919c69f721fSFande Kong   PetscFunctionReturn(0);
1920c69f721fSFande Kong }
1921c69f721fSFande Kong 
1922d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
1923d71ae5a4SJacob Faibussowitsch {
1924c69f721fSFande Kong   hypre_ParCSRMatrix *parcsr;
19252cf14000SStefano Zampini   HYPRE_Int           hnz;
1926c69f721fSFande Kong 
1927c69f721fSFande Kong   PetscFunctionBegin;
1928c69f721fSFande Kong   /* retrieve the internal matrix */
19299566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
1930c69f721fSFande Kong   /* call HYPRE API */
1931792fecdfSBarry Smith   PetscCallExternal(HYPRE_ParCSRMatrixGetRow, parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v);
19322cf14000SStefano Zampini   if (nz) *nz = (PetscInt)hnz;
1933c69f721fSFande Kong   PetscFunctionReturn(0);
1934c69f721fSFande Kong }
1935c69f721fSFande Kong 
1936d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
1937d71ae5a4SJacob Faibussowitsch {
1938c69f721fSFande Kong   hypre_ParCSRMatrix *parcsr;
19392cf14000SStefano Zampini   HYPRE_Int           hnz;
1940c69f721fSFande Kong 
1941c69f721fSFande Kong   PetscFunctionBegin;
1942c69f721fSFande Kong   /* retrieve the internal matrix */
19439566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
1944c69f721fSFande Kong   /* call HYPRE API */
19452cf14000SStefano Zampini   hnz = nz ? (HYPRE_Int)(*nz) : 0;
1946792fecdfSBarry Smith   PetscCallExternal(HYPRE_ParCSRMatrixRestoreRow, parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v);
1947c69f721fSFande Kong   PetscFunctionReturn(0);
1948c69f721fSFande Kong }
1949c69f721fSFande Kong 
1950d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetValues_HYPRE(Mat A, PetscInt m, const PetscInt idxm[], PetscInt n, const PetscInt idxn[], PetscScalar v[])
1951d71ae5a4SJacob Faibussowitsch {
195245b8d346SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1953c69f721fSFande Kong   PetscInt   i;
19541d4906efSStefano Zampini 
1955c69f721fSFande Kong   PetscFunctionBegin;
1956c69f721fSFande Kong   if (!m || !n) PetscFunctionReturn(0);
1957c69f721fSFande Kong   /* Ignore negative row indices
1958c69f721fSFande Kong    * And negative column indices should be automatically ignored in hypre
1959c69f721fSFande Kong    * */
19602cf14000SStefano Zampini   for (i = 0; i < m; i++) {
19612cf14000SStefano Zampini     if (idxm[i] >= 0) {
19622cf14000SStefano Zampini       HYPRE_Int hn = (HYPRE_Int)n;
1963792fecdfSBarry Smith       PetscCallExternal(HYPRE_IJMatrixGetValues, hA->ij, 1, &hn, (HYPRE_BigInt *)&idxm[i], (HYPRE_BigInt *)idxn, (HYPRE_Complex *)(v + i * n));
19642cf14000SStefano Zampini     }
19652cf14000SStefano Zampini   }
1966c69f721fSFande Kong   PetscFunctionReturn(0);
1967c69f721fSFande Kong }
1968c69f721fSFande Kong 
1969d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetOption_HYPRE(Mat A, MatOption op, PetscBool flg)
1970d71ae5a4SJacob Faibussowitsch {
1971ddbeb582SStefano Zampini   Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1972ddbeb582SStefano Zampini 
1973ddbeb582SStefano Zampini   PetscFunctionBegin;
1974c6698e78SStefano Zampini   switch (op) {
1975ddbeb582SStefano Zampini   case MAT_NO_OFF_PROC_ENTRIES:
197648a46eb9SPierre Jolivet     if (flg) PetscCallExternal(HYPRE_IJMatrixSetMaxOffProcElmts, hA->ij, 0);
1977ddbeb582SStefano Zampini     break;
1978d71ae5a4SJacob Faibussowitsch   case MAT_SORTED_FULL:
1979d71ae5a4SJacob Faibussowitsch     hA->sorted_full = flg;
1980d71ae5a4SJacob Faibussowitsch     break;
1981d71ae5a4SJacob Faibussowitsch   default:
1982d71ae5a4SJacob Faibussowitsch     break;
1983ddbeb582SStefano Zampini   }
1984ddbeb582SStefano Zampini   PetscFunctionReturn(0);
1985ddbeb582SStefano Zampini }
1986c69f721fSFande Kong 
1987d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view)
1988d71ae5a4SJacob Faibussowitsch {
198945b8d346SStefano Zampini   PetscViewerFormat format;
199045b8d346SStefano Zampini 
199145b8d346SStefano Zampini   PetscFunctionBegin;
19929566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(view, &format));
19936ea7df73SStefano Zampini   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0);
199445b8d346SStefano Zampini   if (format != PETSC_VIEWER_NATIVE) {
19956ea7df73SStefano Zampini     Mat                 B;
19966ea7df73SStefano Zampini     hypre_ParCSRMatrix *parcsr;
19976ea7df73SStefano Zampini     PetscErrorCode (*mview)(Mat, PetscViewer) = NULL;
19986ea7df73SStefano Zampini 
19999566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
20009566063dSJacob Faibussowitsch     PetscCall(MatCreateFromParCSR(parcsr, MATAIJ, PETSC_USE_POINTER, &B));
20019566063dSJacob Faibussowitsch     PetscCall(MatGetOperation(B, MATOP_VIEW, (void (**)(void)) & mview));
200228b400f6SJacob Faibussowitsch     PetscCheck(mview, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Missing view operation");
20039566063dSJacob Faibussowitsch     PetscCall((*mview)(B, view));
20049566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&B));
200545b8d346SStefano Zampini   } else {
200645b8d346SStefano Zampini     Mat_HYPRE  *hA = (Mat_HYPRE *)A->data;
200745b8d346SStefano Zampini     PetscMPIInt size;
200845b8d346SStefano Zampini     PetscBool   isascii;
200945b8d346SStefano Zampini     const char *filename;
201045b8d346SStefano Zampini 
201145b8d346SStefano Zampini     /* HYPRE uses only text files */
20129566063dSJacob Faibussowitsch     PetscCall(PetscObjectTypeCompare((PetscObject)view, PETSCVIEWERASCII, &isascii));
201328b400f6SJacob Faibussowitsch     PetscCheck(isascii, PetscObjectComm((PetscObject)view), PETSC_ERR_SUP, "PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII", ((PetscObject)view)->type_name);
20149566063dSJacob Faibussowitsch     PetscCall(PetscViewerFileGetName(view, &filename));
2015792fecdfSBarry Smith     PetscCallExternal(HYPRE_IJMatrixPrint, hA->ij, filename);
20169566063dSJacob Faibussowitsch     PetscCallMPI(MPI_Comm_size(hA->comm, &size));
201745b8d346SStefano Zampini     if (size > 1) {
20189566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(view, "Matrix files: %s.%05d ... %s.%05d\n", filename, 0, filename, size - 1));
201945b8d346SStefano Zampini     } else {
20209566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(view, "Matrix file: %s.%05d\n", filename, 0));
202145b8d346SStefano Zampini     }
202245b8d346SStefano Zampini   }
202345b8d346SStefano Zampini   PetscFunctionReturn(0);
202445b8d346SStefano Zampini }
202545b8d346SStefano Zampini 
2026d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDuplicate_HYPRE(Mat A, MatDuplicateOption op, Mat *B)
2027d71ae5a4SJacob Faibussowitsch {
20286abb4441SStefano Zampini   hypre_ParCSRMatrix *parcsr = NULL;
202945b8d346SStefano Zampini   PetscCopyMode       cpmode;
203045b8d346SStefano Zampini 
203145b8d346SStefano Zampini   PetscFunctionBegin;
20329566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
203345b8d346SStefano Zampini   if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) {
20340e6427aaSSatish Balay     parcsr = hypre_ParCSRMatrixClone(parcsr, 0);
203545b8d346SStefano Zampini     cpmode = PETSC_OWN_POINTER;
203645b8d346SStefano Zampini   } else {
203745b8d346SStefano Zampini     cpmode = PETSC_COPY_VALUES;
203845b8d346SStefano Zampini   }
20399566063dSJacob Faibussowitsch   PetscCall(MatCreateFromParCSR(parcsr, MATHYPRE, cpmode, B));
204045b8d346SStefano Zampini   PetscFunctionReturn(0);
204145b8d346SStefano Zampini }
204245b8d346SStefano Zampini 
2043d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str)
2044d71ae5a4SJacob Faibussowitsch {
2045465edc17SStefano Zampini   hypre_ParCSRMatrix *acsr, *bcsr;
2046465edc17SStefano Zampini 
2047465edc17SStefano Zampini   PetscFunctionBegin;
2048465edc17SStefano Zampini   if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) {
20499566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(A, &acsr));
20509566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR_HYPRE(B, &bcsr));
2051792fecdfSBarry Smith     PetscCallExternal(hypre_ParCSRMatrixCopy, acsr, bcsr, 1);
20529566063dSJacob Faibussowitsch     PetscCall(MatSetOption(B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */
20539566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
20549566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
2055465edc17SStefano Zampini   } else {
20569566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2057465edc17SStefano Zampini   }
2058465edc17SStefano Zampini   PetscFunctionReturn(0);
2059465edc17SStefano Zampini }
2060465edc17SStefano Zampini 
2061d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d)
2062d71ae5a4SJacob Faibussowitsch {
20636305df00SStefano Zampini   hypre_ParCSRMatrix *parcsr;
20646305df00SStefano Zampini   hypre_CSRMatrix    *dmat;
206539accc25SStefano Zampini   HYPRE_Complex      *a;
206639accc25SStefano Zampini   HYPRE_Complex      *data = NULL;
20672cf14000SStefano Zampini   HYPRE_Int          *diag = NULL;
20682cf14000SStefano Zampini   PetscInt            i;
20696305df00SStefano Zampini   PetscBool           cong;
20706305df00SStefano Zampini 
20716305df00SStefano Zampini   PetscFunctionBegin;
20729566063dSJacob Faibussowitsch   PetscCall(MatHasCongruentLayouts(A, &cong));
207328b400f6SJacob Faibussowitsch   PetscCheck(cong, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only for square matrices with same local distributions of rows and columns");
207476bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
20756305df00SStefano Zampini     PetscBool miss;
20769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal(A, &miss, NULL));
207708401ef6SPierre Jolivet     PetscCheck(!miss || !A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_SUP, "Not implemented when diagonal entries are missing");
20786305df00SStefano Zampini   }
20799566063dSJacob Faibussowitsch   PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
20806305df00SStefano Zampini   dmat = hypre_ParCSRMatrixDiag(parcsr);
20816305df00SStefano Zampini   if (dmat) {
208239accc25SStefano Zampini     /* this cast fixes the clang error: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */
20839566063dSJacob Faibussowitsch     PetscCall(VecGetArray(d, (PetscScalar **)&a));
20842cf14000SStefano Zampini     diag = hypre_CSRMatrixI(dmat);
208539accc25SStefano Zampini     data = hypre_CSRMatrixData(dmat);
20866305df00SStefano Zampini     for (i = 0; i < A->rmap->n; i++) a[i] = data[diag[i]];
20879566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(d, (PetscScalar **)&a));
20886305df00SStefano Zampini   }
20896305df00SStefano Zampini   PetscFunctionReturn(0);
20906305df00SStefano Zampini }
20916305df00SStefano Zampini 
2092363d496dSStefano Zampini #include <petscblaslapack.h>
2093363d496dSStefano Zampini 
2094d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAXPY_HYPRE(Mat Y, PetscScalar a, Mat X, MatStructure str)
2095d71ae5a4SJacob Faibussowitsch {
2096363d496dSStefano Zampini   PetscFunctionBegin;
20976ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
20986ea7df73SStefano Zampini   {
20996ea7df73SStefano Zampini     Mat                 B;
21006ea7df73SStefano Zampini     hypre_ParCSRMatrix *x, *y, *z;
21016ea7df73SStefano Zampini 
21029566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(Y, &y));
21039566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(X, &x));
2104792fecdfSBarry Smith     PetscCallExternal(hypre_ParCSRMatrixAdd, 1.0, y, 1.0, x, &z);
21059566063dSJacob Faibussowitsch     PetscCall(MatCreateFromParCSR(z, MATHYPRE, PETSC_OWN_POINTER, &B));
21069566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
21076ea7df73SStefano Zampini   }
21086ea7df73SStefano Zampini #else
2109363d496dSStefano Zampini   if (str == SAME_NONZERO_PATTERN) {
2110363d496dSStefano Zampini     hypre_ParCSRMatrix *x, *y;
2111363d496dSStefano Zampini     hypre_CSRMatrix *xloc, *yloc;
2112363d496dSStefano Zampini     PetscInt xnnz, ynnz;
211339accc25SStefano Zampini     HYPRE_Complex *xarr, *yarr;
2114363d496dSStefano Zampini     PetscBLASInt one = 1, bnz;
2115363d496dSStefano Zampini 
21169566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(Y, &y));
21179566063dSJacob Faibussowitsch     PetscCall(MatHYPREGetParCSR(X, &x));
2118363d496dSStefano Zampini 
2119363d496dSStefano Zampini     /* diagonal block */
2120363d496dSStefano Zampini     xloc = hypre_ParCSRMatrixDiag(x);
2121363d496dSStefano Zampini     yloc = hypre_ParCSRMatrixDiag(y);
2122363d496dSStefano Zampini     xnnz = 0;
2123363d496dSStefano Zampini     ynnz = 0;
2124363d496dSStefano Zampini     xarr = NULL;
2125363d496dSStefano Zampini     yarr = NULL;
2126363d496dSStefano Zampini     if (xloc) {
212739accc25SStefano Zampini       xarr = hypre_CSRMatrixData(xloc);
2128363d496dSStefano Zampini       xnnz = hypre_CSRMatrixNumNonzeros(xloc);
2129363d496dSStefano Zampini     }
2130363d496dSStefano Zampini     if (yloc) {
213139accc25SStefano Zampini       yarr = hypre_CSRMatrixData(yloc);
2132363d496dSStefano Zampini       ynnz = hypre_CSRMatrixNumNonzeros(yloc);
2133363d496dSStefano Zampini     }
213408401ef6SPierre Jolivet     PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz);
21359566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(xnnz, &bnz));
2136792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one));
2137363d496dSStefano Zampini 
2138363d496dSStefano Zampini     /* off-diagonal block */
2139363d496dSStefano Zampini     xloc = hypre_ParCSRMatrixOffd(x);
2140363d496dSStefano Zampini     yloc = hypre_ParCSRMatrixOffd(y);
2141363d496dSStefano Zampini     xnnz = 0;
2142363d496dSStefano Zampini     ynnz = 0;
2143363d496dSStefano Zampini     xarr = NULL;
2144363d496dSStefano Zampini     yarr = NULL;
2145363d496dSStefano Zampini     if (xloc) {
214639accc25SStefano Zampini       xarr = hypre_CSRMatrixData(xloc);
2147363d496dSStefano Zampini       xnnz = hypre_CSRMatrixNumNonzeros(xloc);
2148363d496dSStefano Zampini     }
2149363d496dSStefano Zampini     if (yloc) {
215039accc25SStefano Zampini       yarr = hypre_CSRMatrixData(yloc);
2151363d496dSStefano Zampini       ynnz = hypre_CSRMatrixNumNonzeros(yloc);
2152363d496dSStefano Zampini     }
215308401ef6SPierre Jolivet     PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz);
21549566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(xnnz, &bnz));
2155792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one));
2156363d496dSStefano Zampini   } else if (str == SUBSET_NONZERO_PATTERN) {
21579566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
2158363d496dSStefano Zampini   } else {
2159363d496dSStefano Zampini     Mat B;
2160363d496dSStefano Zampini 
21619566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic_Preallocate(Y, X, &B));
21629566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
21639566063dSJacob Faibussowitsch     PetscCall(MatHeaderReplace(Y, &B));
2164363d496dSStefano Zampini   }
21656ea7df73SStefano Zampini #endif
2166363d496dSStefano Zampini   PetscFunctionReturn(0);
2167363d496dSStefano Zampini }
2168363d496dSStefano Zampini 
2169d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetPreallocationCOO_HYPRE(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
2170d71ae5a4SJacob Faibussowitsch {
21715fbaff96SJunchao Zhang   MPI_Comm             comm;
21725fbaff96SJunchao Zhang   PetscMPIInt          size;
21735fbaff96SJunchao Zhang   PetscLayout          rmap, cmap;
21745fbaff96SJunchao Zhang   Mat_HYPRE           *hmat;
21755fbaff96SJunchao Zhang   hypre_ParCSRMatrix  *parCSR;
21765fbaff96SJunchao Zhang   hypre_CSRMatrix     *diag, *offd;
21775fbaff96SJunchao Zhang   Mat                  A, B, cooMat;
21785fbaff96SJunchao Zhang   PetscScalar         *Aa, *Ba;
21795fbaff96SJunchao Zhang   HYPRE_MemoryLocation hypreMemtype = HYPRE_MEMORY_HOST;
21805fbaff96SJunchao Zhang   PetscMemType         petscMemtype;
21815fbaff96SJunchao Zhang   MatType              matType = MATAIJ; /* default type of cooMat */
21825fbaff96SJunchao Zhang 
21835fbaff96SJunchao Zhang   PetscFunctionBegin;
21845fbaff96SJunchao Zhang   /* Build an agent matrix cooMat whose type is either MATAIJ or MATAIJKOKKOS.
21855fbaff96SJunchao Zhang      It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work.
21865fbaff96SJunchao Zhang    */
21875fbaff96SJunchao Zhang   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
21885fbaff96SJunchao Zhang   PetscCallMPI(MPI_Comm_size(comm, &size));
21895fbaff96SJunchao Zhang   PetscCall(PetscLayoutSetUp(mat->rmap));
21905fbaff96SJunchao Zhang   PetscCall(PetscLayoutSetUp(mat->cmap));
21915fbaff96SJunchao Zhang   PetscCall(MatGetLayouts(mat, &rmap, &cmap));
21925fbaff96SJunchao Zhang 
21935fbaff96SJunchao Zhang   /* I do not know how hypre_ParCSRMatrix stores diagonal elements for non-square matrices, so I just give up now */
21945fbaff96SJunchao Zhang   PetscCheck(rmap->N == cmap->N, comm, PETSC_ERR_SUP, "MATHYPRE COO cannot handle non-square matrices");
21955fbaff96SJunchao Zhang 
21965fbaff96SJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
21975fbaff96SJunchao Zhang   if (!mat->boundtocpu) { /* mat will be on device, so will cooMat */
21985fbaff96SJunchao Zhang   #if defined(PETSC_HAVE_KOKKOS)
21995fbaff96SJunchao Zhang     matType = MATAIJKOKKOS;
22005fbaff96SJunchao Zhang   #else
22015fbaff96SJunchao Zhang     SETERRQ(comm, PETSC_ERR_SUP, "To support MATHYPRE COO assembly on device, we need Kokkos, e.g., --download-kokkos --download-kokkos-kernels");
22025fbaff96SJunchao Zhang   #endif
22035fbaff96SJunchao Zhang   }
22045fbaff96SJunchao Zhang #endif
22055fbaff96SJunchao Zhang 
22065fbaff96SJunchao Zhang   /* Do COO preallocation through cooMat */
22075fbaff96SJunchao Zhang   hmat = (Mat_HYPRE *)mat->data;
22085fbaff96SJunchao Zhang   PetscCall(MatDestroy(&hmat->cooMat));
22095fbaff96SJunchao Zhang   PetscCall(MatCreate(comm, &cooMat));
22105fbaff96SJunchao Zhang   PetscCall(MatSetType(cooMat, matType));
22115fbaff96SJunchao Zhang   PetscCall(MatSetLayouts(cooMat, rmap, cmap));
22125fbaff96SJunchao Zhang   PetscCall(MatSetPreallocationCOO(cooMat, coo_n, coo_i, coo_j));
22135fbaff96SJunchao Zhang 
22145fbaff96SJunchao Zhang   /* Copy the sparsity pattern from cooMat to hypre IJMatrix hmat->ij */
22155fbaff96SJunchao Zhang   PetscCall(MatSetOption(mat, MAT_SORTED_FULL, PETSC_TRUE));
22165fbaff96SJunchao Zhang   PetscCall(MatSetOption(mat, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE));
22175fbaff96SJunchao Zhang   PetscCall(MatHYPRE_CreateFromMat(cooMat, hmat));    /* Create hmat->ij and preallocate it */
22185fbaff96SJunchao Zhang   PetscCall(MatHYPRE_IJMatrixCopy(cooMat, hmat->ij)); /* Copy A's (a,i,j) to hmat->ij. To reuse code. Copying 'a' is not really needed */
22195fbaff96SJunchao Zhang 
22205fbaff96SJunchao Zhang   mat->preallocated = PETSC_TRUE;
22215fbaff96SJunchao Zhang   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
22225fbaff96SJunchao Zhang   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); /* Migrate mat to device if it is bound to. Hypre builds its own SpMV context here */
22235fbaff96SJunchao Zhang 
22245fbaff96SJunchao Zhang   /* Alias cooMat's data array to IJMatrix's */
2225792fecdfSBarry Smith   PetscCallExternal(HYPRE_IJMatrixGetObject, hmat->ij, (void **)&parCSR);
22265fbaff96SJunchao Zhang   diag = hypre_ParCSRMatrixDiag(parCSR);
22275fbaff96SJunchao Zhang   offd = hypre_ParCSRMatrixOffd(parCSR);
22285fbaff96SJunchao Zhang 
22295fbaff96SJunchao Zhang   hypreMemtype = hypre_CSRMatrixMemoryLocation(diag);
22305fbaff96SJunchao Zhang   A            = (size == 1) ? cooMat : ((Mat_MPIAIJ *)cooMat->data)->A;
22315fbaff96SJunchao Zhang   PetscCall(MatSeqAIJGetCSRAndMemType(A, NULL, NULL, &Aa, &petscMemtype));
22329371c9d4SSatish Balay   PetscAssert((PetscMemTypeHost(petscMemtype) && hypreMemtype == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(petscMemtype) && hypreMemtype == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch");
22335fbaff96SJunchao Zhang 
22345fbaff96SJunchao Zhang   hmat->diagJ = hypre_CSRMatrixJ(diag);
2235e77caa6dSBarry Smith   PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(diag), hypreMemtype));
22365fbaff96SJunchao Zhang   hypre_CSRMatrixData(diag)     = (HYPRE_Complex *)Aa;
22375fbaff96SJunchao Zhang   hypre_CSRMatrixOwnsData(diag) = 0; /* Take ownership of (j,a) away from hypre. As a result, we need to free them on our own */
22385fbaff96SJunchao Zhang 
22395fbaff96SJunchao Zhang   /* Copy diagonal pointers of A to device to facilitate MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos */
22405fbaff96SJunchao Zhang   if (hypreMemtype == HYPRE_MEMORY_DEVICE) {
2241e77caa6dSBarry Smith     PetscStackCallExternalVoid("hypre_TAlloc", hmat->diag = hypre_TAlloc(PetscInt, rmap->n, hypreMemtype));
22425fbaff96SJunchao Zhang     PetscCall(MatMarkDiagonal_SeqAIJ(A)); /* We need updated diagonal positions */
2243e77caa6dSBarry Smith     PetscStackCallExternalVoid("hypre_TMemcpy", hypre_TMemcpy(hmat->diag, ((Mat_SeqAIJ *)A->data)->diag, PetscInt, rmap->n, hypreMemtype, HYPRE_MEMORY_HOST));
22445fbaff96SJunchao Zhang   }
22455fbaff96SJunchao Zhang 
22465fbaff96SJunchao Zhang   if (size > 1) {
22475fbaff96SJunchao Zhang     B = ((Mat_MPIAIJ *)cooMat->data)->B;
22485fbaff96SJunchao Zhang     PetscCall(MatSeqAIJGetCSRAndMemType(B, NULL, NULL, &Ba, &petscMemtype));
22495fbaff96SJunchao Zhang     hmat->offdJ = hypre_CSRMatrixJ(offd);
2250e77caa6dSBarry Smith     PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(offd), hypreMemtype));
22515fbaff96SJunchao Zhang     hypre_CSRMatrixData(offd)     = (HYPRE_Complex *)Ba;
22525fbaff96SJunchao Zhang     hypre_CSRMatrixOwnsData(offd) = 0;
22535fbaff96SJunchao Zhang   }
22545fbaff96SJunchao Zhang 
22555fbaff96SJunchao Zhang   /* Record cooMat for use in MatSetValuesCOO_HYPRE */
22565fbaff96SJunchao Zhang   hmat->cooMat  = cooMat;
22575fbaff96SJunchao Zhang   hmat->memType = hypreMemtype;
22585fbaff96SJunchao Zhang   PetscFunctionReturn(0);
22595fbaff96SJunchao Zhang }
22605fbaff96SJunchao Zhang 
2261d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_HYPRE(Mat mat, const PetscScalar v[], InsertMode imode)
2262d71ae5a4SJacob Faibussowitsch {
22635fbaff96SJunchao Zhang   Mat_HYPRE  *hmat = (Mat_HYPRE *)mat->data;
22645fbaff96SJunchao Zhang   PetscMPIInt size;
22655fbaff96SJunchao Zhang   Mat         A;
22665fbaff96SJunchao Zhang 
22675fbaff96SJunchao Zhang   PetscFunctionBegin;
22685fbaff96SJunchao Zhang   PetscCheck(hmat->cooMat, hmat->comm, PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet");
22695fbaff96SJunchao Zhang   PetscCallMPI(MPI_Comm_size(hmat->comm, &size));
22705fbaff96SJunchao Zhang   PetscCall(MatSetValuesCOO(hmat->cooMat, v, imode));
22715fbaff96SJunchao Zhang 
22725fbaff96SJunchao Zhang   /* Move diagonal elements of the diagonal block to the front of their row, as needed by ParCSRMatrix. So damn hacky */
22735fbaff96SJunchao Zhang   A = (size == 1) ? hmat->cooMat : ((Mat_MPIAIJ *)hmat->cooMat->data)->A;
22745fbaff96SJunchao Zhang   if (hmat->memType == HYPRE_MEMORY_HOST) {
22755fbaff96SJunchao Zhang     Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)A->data;
22765fbaff96SJunchao Zhang     PetscInt     i, m, *Ai = aij->i, *Adiag = aij->diag;
22775fbaff96SJunchao Zhang     PetscScalar *Aa = aij->a, tmp;
22785fbaff96SJunchao Zhang 
22795fbaff96SJunchao Zhang     PetscCall(MatGetSize(A, &m, NULL));
22805fbaff96SJunchao Zhang     for (i = 0; i < m; i++) {
22815fbaff96SJunchao Zhang       if (Adiag[i] >= Ai[i] && Adiag[i] < Ai[i + 1]) { /* Digonal element of this row exists in a[] and j[] */
22825fbaff96SJunchao Zhang         tmp          = Aa[Ai[i]];
22835fbaff96SJunchao Zhang         Aa[Ai[i]]    = Aa[Adiag[i]];
22845fbaff96SJunchao Zhang         Aa[Adiag[i]] = tmp;
22855fbaff96SJunchao Zhang       }
22865fbaff96SJunchao Zhang     }
22875fbaff96SJunchao Zhang   } else {
22885fbaff96SJunchao Zhang #if defined(PETSC_HAVE_KOKKOS_KERNELS)
22895fbaff96SJunchao Zhang     PetscCall(MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos(A, hmat->diag));
22905fbaff96SJunchao Zhang #endif
22915fbaff96SJunchao Zhang   }
22925fbaff96SJunchao Zhang   PetscFunctionReturn(0);
22935fbaff96SJunchao Zhang }
22945fbaff96SJunchao Zhang 
/*MC
   MATHYPRE - MATHYPRE = "hypre" - A matrix type to be used for sequential and parallel sparse matrices
          based on the hypre IJ interface.

   Level: intermediate

.seealso: `MatCreate()`, `MatHYPRESetPreallocation()`
M*/
2303a055b5aaSBarry Smith 
2304d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B)
2305d71ae5a4SJacob Faibussowitsch {
230663c07aadSStefano Zampini   Mat_HYPRE *hB;
230763c07aadSStefano Zampini 
230863c07aadSStefano Zampini   PetscFunctionBegin;
23094dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&hB));
23106ea7df73SStefano Zampini 
2311978814f1SStefano Zampini   hB->inner_free  = PETSC_TRUE;
2312c69f721fSFande Kong   hB->available   = PETSC_TRUE;
2313336664bdSPierre Jolivet   hB->sorted_full = PETSC_FALSE; /* no assumption whether column indices are sorted or not */
2314c69f721fSFande Kong   hB->size        = 0;
2315c69f721fSFande Kong   hB->array       = NULL;
2316978814f1SStefano Zampini 
231763c07aadSStefano Zampini   B->data      = (void *)hB;
231863c07aadSStefano Zampini   B->assembled = PETSC_FALSE;
231963c07aadSStefano Zampini 
23209566063dSJacob Faibussowitsch   PetscCall(PetscMemzero(B->ops, sizeof(struct _MatOps)));
232163c07aadSStefano Zampini   B->ops->mult                  = MatMult_HYPRE;
232263c07aadSStefano Zampini   B->ops->multtranspose         = MatMultTranspose_HYPRE;
2323414bd5c3SStefano Zampini   B->ops->multadd               = MatMultAdd_HYPRE;
2324414bd5c3SStefano Zampini   B->ops->multtransposeadd      = MatMultTransposeAdd_HYPRE;
232563c07aadSStefano Zampini   B->ops->setup                 = MatSetUp_HYPRE;
232663c07aadSStefano Zampini   B->ops->destroy               = MatDestroy_HYPRE;
232763c07aadSStefano Zampini   B->ops->assemblyend           = MatAssemblyEnd_HYPRE;
2328c69f721fSFande Kong   B->ops->assemblybegin         = MatAssemblyBegin_HYPRE;
2329d975228cSstefano_zampini   B->ops->setvalues             = MatSetValues_HYPRE;
233068ec7858SStefano Zampini   B->ops->missingdiagonal       = MatMissingDiagonal_HYPRE;
233168ec7858SStefano Zampini   B->ops->scale                 = MatScale_HYPRE;
233268ec7858SStefano Zampini   B->ops->zerorowscolumns       = MatZeroRowsColumns_HYPRE;
2333c69f721fSFande Kong   B->ops->zeroentries           = MatZeroEntries_HYPRE;
2334c69f721fSFande Kong   B->ops->zerorows              = MatZeroRows_HYPRE;
2335c69f721fSFande Kong   B->ops->getrow                = MatGetRow_HYPRE;
2336c69f721fSFande Kong   B->ops->restorerow            = MatRestoreRow_HYPRE;
2337c69f721fSFande Kong   B->ops->getvalues             = MatGetValues_HYPRE;
2338ddbeb582SStefano Zampini   B->ops->setoption             = MatSetOption_HYPRE;
233945b8d346SStefano Zampini   B->ops->duplicate             = MatDuplicate_HYPRE;
2340465edc17SStefano Zampini   B->ops->copy                  = MatCopy_HYPRE;
234145b8d346SStefano Zampini   B->ops->view                  = MatView_HYPRE;
23426305df00SStefano Zampini   B->ops->getdiagonal           = MatGetDiagonal_HYPRE;
2343363d496dSStefano Zampini   B->ops->axpy                  = MatAXPY_HYPRE;
23444222ddf1SHong Zhang   B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE;
23456ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
23466ea7df73SStefano Zampini   B->ops->bindtocpu = MatBindToCPU_HYPRE;
23476ea7df73SStefano Zampini   B->boundtocpu     = PETSC_FALSE;
23486ea7df73SStefano Zampini #endif
234945b8d346SStefano Zampini 
235045b8d346SStefano Zampini   /* build cache for off array entries formed */
23519566063dSJacob Faibussowitsch   PetscCall(MatStashCreate_Private(PetscObjectComm((PetscObject)B), 1, &B->stash));
235263c07aadSStefano Zampini 
23539566063dSJacob Faibussowitsch   PetscCall(PetscCommGetComm(PetscObjectComm((PetscObject)B), &hB->comm));
23549566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATHYPRE));
23559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_aij_C", MatConvert_HYPRE_AIJ));
23569566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_is_C", MatConvert_HYPRE_IS));
23579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_hypre_C", MatProductSetFromOptions_HYPRE));
23589566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaij_hypre_C", MatProductSetFromOptions_HYPRE));
23599566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPRESetPreallocation_C", MatHYPRESetPreallocation_HYPRE));
23609566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPREGetParCSR_C", MatHYPREGetParCSR_HYPRE));
23615fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_HYPRE));
23625fbaff96SJunchao Zhang   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_HYPRE));
23636ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
23646ea7df73SStefano Zampini   #if defined(HYPRE_USING_HIP)
23659566063dSJacob Faibussowitsch   PetscCall(PetscDeviceInitialize(PETSC_DEVICE_HIP));
23669566063dSJacob Faibussowitsch   PetscCall(MatSetVecType(B, VECHIP));
23676ea7df73SStefano Zampini   #endif
23686ea7df73SStefano Zampini   #if defined(HYPRE_USING_CUDA)
23699566063dSJacob Faibussowitsch   PetscCall(PetscDeviceInitialize(PETSC_DEVICE_CUDA));
23709566063dSJacob Faibussowitsch   PetscCall(MatSetVecType(B, VECCUDA));
23716ea7df73SStefano Zampini   #endif
23726ea7df73SStefano Zampini #endif
237363c07aadSStefano Zampini   PetscFunctionReturn(0);
237463c07aadSStefano Zampini }
237563c07aadSStefano Zampini 
2376d71ae5a4SJacob Faibussowitsch static PetscErrorCode hypre_array_destroy(void *ptr)
2377d71ae5a4SJacob Faibussowitsch {
2378225daaf8SStefano Zampini   PetscFunctionBegin;
2379e6de0934SSatish Balay   hypre_TFree(ptr, HYPRE_MEMORY_HOST);
2380225daaf8SStefano Zampini   PetscFunctionReturn(0);
2381225daaf8SStefano Zampini }
2382