163c07aadSStefano Zampini /* 263c07aadSStefano Zampini Creates hypre ijmatrix from PETSc matrix 363c07aadSStefano Zampini */ 4225daaf8SStefano Zampini 5c6698e78SStefano Zampini #include <petscpkg_version.h> 639accc25SStefano Zampini #include <petsc/private/petschypre.h> 7dd9c0a25Sstefano_zampini #include <petscmathypre.h> 863c07aadSStefano Zampini #include <petsc/private/matimpl.h> 9a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h> 1063c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h> 1163c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h> 1258968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h> 1358968eb6SStefano Zampini #include <HYPRE.h> 14c1a070e6SStefano Zampini #include <HYPRE_utilities.h> 15cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h> 1668ec7858SStefano Zampini #include <_hypre_sstruct_ls.h> 1763c07aadSStefano Zampini 180e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 190e6427aaSSatish Balay #define hypre_ParCSRMatrixClone(A, B) hypre_ParCSRMatrixCompleteClone(A) 200e6427aaSSatish Balay #endif 210e6427aaSSatish Balay 22bb16242fSVictor A. P. Magri #if PETSC_PKG_HYPRE_VERSION_GE(2, 15, 0) 23bb16242fSVictor A. P. Magri #define HYPRE_AssumedPartitionCheck() 1 24bb16242fSVictor A. P. Magri #endif 25bb16242fSVictor A. P. 
Magri 2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat, Mat_HYPRE *); 2763c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat, Mat, HYPRE_IJMatrix); 28b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_MPIAIJ(Mat, HYPRE_IJMatrix); 29b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_SeqAIJ(Mat, HYPRE_IJMatrix); 3039accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat, HYPRE_Complex, Vec, HYPRE_Complex, Vec, PetscBool); 316ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[], const PetscScalar[], InsertMode ins); 3263c07aadSStefano Zampini 33d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij) 34d71ae5a4SJacob Faibussowitsch { 3563c07aadSStefano Zampini PetscInt i, n_d, n_o; 3663c07aadSStefano Zampini const PetscInt *ia_d, *ia_o; 3763c07aadSStefano Zampini PetscBool done_d = PETSC_FALSE, done_o = PETSC_FALSE; 382cf14000SStefano Zampini HYPRE_Int *nnz_d = NULL, *nnz_o = NULL; 3963c07aadSStefano Zampini 4063c07aadSStefano Zampini PetscFunctionBegin; 4163c07aadSStefano Zampini if (A_d) { /* determine number of nonzero entries in local diagonal part */ 429566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, &n_d, &ia_d, NULL, &done_d)); 4363c07aadSStefano Zampini if (done_d) { 449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_d, &nnz_d)); 45*f2f41e48SZach Atkins for (i = 0; i < n_d; i++) nnz_d[i] = (HYPRE_Int)(ia_d[i + 1] - ia_d[i]); 4663c07aadSStefano Zampini } 479566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, NULL, &ia_d, NULL, &done_d)); 4863c07aadSStefano Zampini } 4963c07aadSStefano Zampini if (A_o) { /* determine number of nonzero entries in local off-diagonal part */ 509566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_o, 0, 
PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o)); 5163c07aadSStefano Zampini if (done_o) { 529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_o, &nnz_o)); 53*f2f41e48SZach Atkins for (i = 0; i < n_o; i++) nnz_o[i] = (HYPRE_Int)(ia_o[i + 1] - ia_o[i]); 5463c07aadSStefano Zampini } 559566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o)); 5663c07aadSStefano Zampini } 5763c07aadSStefano Zampini if (done_d) { /* set number of nonzeros in HYPRE IJ matrix */ 5863c07aadSStefano Zampini if (!done_o) { /* only diagonal part */ 599566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n_d, &nnz_o)); 6063c07aadSStefano Zampini } 61c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 62c6698e78SStefano Zampini { /* If we don't do this, the columns of the matrix will be all zeros! */ 63c6698e78SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 64c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 65c6698e78SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 66c6698e78SStefano Zampini hypre_IJMatrixTranslator(ij) = NULL; 67a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(ij, nnz_d, nnz_o)); 6822235d61SPierre Jolivet /* it seems they partially fixed it in 2.19.0 */ 6922235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 70c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 71c6698e78SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; 7222235d61SPierre Jolivet #endif 73c6698e78SStefano Zampini } 74c6698e78SStefano Zampini #else 75a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(ij, nnz_d, nnz_o)); 76c6698e78SStefano Zampini #endif 779566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_d)); 789566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_o)); 7963c07aadSStefano Zampini } 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 
8163c07aadSStefano Zampini } 8263c07aadSStefano Zampini 83d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA) 84d71ae5a4SJacob Faibussowitsch { 85*f2f41e48SZach Atkins HYPRE_Int rstart, rend, cstart, cend; 8663c07aadSStefano Zampini 8763c07aadSStefano Zampini PetscFunctionBegin; 889566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 899566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 90*f2f41e48SZach Atkins rstart = (HYPRE_Int)A->rmap->rstart; 91*f2f41e48SZach Atkins rend = (HYPRE_Int)A->rmap->rend; 92*f2f41e48SZach Atkins cstart = (HYPRE_Int)A->cmap->rstart; 93*f2f41e48SZach Atkins cend = (HYPRE_Int)A->cmap->rend; 94ea9ee2c1SPierre Jolivet PetscHYPREInitialize(); 95651b1cf9SStefano Zampini if (hA->ij) { 96651b1cf9SStefano Zampini if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL; 97a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixDestroy(hA->ij)); 98651b1cf9SStefano Zampini } 99a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij)); 100a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR)); 10163c07aadSStefano Zampini { 10263c07aadSStefano Zampini PetscBool same; 10363c07aadSStefano Zampini Mat A_d, A_o; 10463c07aadSStefano Zampini const PetscInt *colmap; 1059566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &same)); 10663c07aadSStefano Zampini if (same) { 1079566063dSJacob Faibussowitsch PetscCall(MatMPIAIJGetSeqAIJ(A, &A_d, &A_o, &colmap)); 1089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij)); 1093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11063c07aadSStefano Zampini } 1119566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIBAIJ, &same)); 11263c07aadSStefano Zampini if (same) { 1139566063dSJacob Faibussowitsch PetscCall(MatMPIBAIJGetSeqBAIJ(A, &A_d, 
&A_o, &colmap)); 1149566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij)); 1153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11663c07aadSStefano Zampini } 1179566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &same)); 11863c07aadSStefano Zampini if (same) { 1199566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij)); 1203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12163c07aadSStefano Zampini } 1229566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQBAIJ, &same)); 12363c07aadSStefano Zampini if (same) { 1249566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij)); 1253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12663c07aadSStefano Zampini } 12763c07aadSStefano Zampini } 1283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12963c07aadSStefano Zampini } 13063c07aadSStefano Zampini 131b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ(Mat A, HYPRE_IJMatrix ij) 132d71ae5a4SJacob Faibussowitsch { 13363c07aadSStefano Zampini PetscBool flg; 13463c07aadSStefano Zampini 13563c07aadSStefano Zampini PetscFunctionBegin; 1366ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 137a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize(ij)); 1386ea7df73SStefano Zampini #else 139a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize_v2(ij, HYPRE_MEMORY_HOST)); 1406ea7df73SStefano Zampini #endif 1419566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &flg)); 142b73e3080SStefano Zampini if (flg) { 143b73e3080SStefano Zampini PetscCall(MatHYPRE_IJMatrixCopyIJ_MPIAIJ(A, ij)); 1443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14563c07aadSStefano Zampini } 1469566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, 
MATSEQAIJ, &flg)); 14763c07aadSStefano Zampini if (flg) { 148b73e3080SStefano Zampini PetscCall(MatHYPRE_IJMatrixCopyIJ_SeqAIJ(A, ij)); 1493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 15063c07aadSStefano Zampini } 151b73e3080SStefano Zampini PetscCheck(PETSC_FALSE, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "No support for matrix type %s", ((PetscObject)A)->type_name); 15287ef5fa6SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS); 15363c07aadSStefano Zampini } 15463c07aadSStefano Zampini 155b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_SeqAIJ(Mat A, HYPRE_IJMatrix ij) 156d71ae5a4SJacob Faibussowitsch { 15763c07aadSStefano Zampini Mat_SeqAIJ *pdiag = (Mat_SeqAIJ *)A->data; 15858968eb6SStefano Zampini HYPRE_Int type; 15963c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 16063c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 16163c07aadSStefano Zampini hypre_CSRMatrix *hdiag; 1622cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 16363c07aadSStefano Zampini 16463c07aadSStefano Zampini PetscFunctionBegin; 165a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(ij, &type)); 16608401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 167a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(ij, (void **)&par_matrix)); 16863c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 16963c07aadSStefano Zampini /* 17063c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 17163c07aadSStefano Zampini */ 1722cf14000SStefano Zampini if (sameint) { 1739566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i, pdiag->i, A->rmap->n + 1)); 1749566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->j, pdiag->j, pdiag->nz)); 1752cf14000SStefano Zampini } else { 1762cf14000SStefano Zampini PetscInt i; 
1772cf14000SStefano Zampini 1782cf14000SStefano Zampini for (i = 0; i < A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i]; 1792cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hdiag->j[i] = (HYPRE_Int)pdiag->j[i]; 1802cf14000SStefano Zampini } 1816ea7df73SStefano Zampini 182ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 18363c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 1843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18563c07aadSStefano Zampini } 18663c07aadSStefano Zampini 187b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_MPIAIJ(Mat A, HYPRE_IJMatrix ij) 188d71ae5a4SJacob Faibussowitsch { 18963c07aadSStefano Zampini Mat_MPIAIJ *pA = (Mat_MPIAIJ *)A->data; 19063c07aadSStefano Zampini Mat_SeqAIJ *pdiag, *poffd; 19163c07aadSStefano Zampini PetscInt i, *garray = pA->garray, *jj, cstart, *pjj; 1922cf14000SStefano Zampini HYPRE_Int *hjj, type; 19363c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 19463c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 19563c07aadSStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 1962cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 19763c07aadSStefano Zampini 19863c07aadSStefano Zampini PetscFunctionBegin; 19963c07aadSStefano Zampini pdiag = (Mat_SeqAIJ *)pA->A->data; 20063c07aadSStefano Zampini poffd = (Mat_SeqAIJ *)pA->B->data; 201da81f932SPierre Jolivet /* cstart is only valid for square MPIAIJ laid out in the usual way */ 2029566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &cstart, NULL)); 20363c07aadSStefano Zampini 204a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(ij, &type)); 20508401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 206a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(ij, (void **)&par_matrix)); 
20763c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 20863c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(par_matrix); 20963c07aadSStefano Zampini 2102cf14000SStefano Zampini if (sameint) { 2119566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i, pdiag->i, pA->A->rmap->n + 1)); 2122cf14000SStefano Zampini } else { 213f4f49eeaSPierre Jolivet for (i = 0; i < pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i]; 2142cf14000SStefano Zampini } 215b73e3080SStefano Zampini 2162cf14000SStefano Zampini hjj = hdiag->j; 2172cf14000SStefano Zampini pjj = pdiag->j; 218c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 219*f2f41e48SZach Atkins for (i = 0; i < pdiag->nz; i++) hjj[i] = (HYPRE_Int)pjj[i]; 220c6698e78SStefano Zampini #else 2212cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hjj[i] = cstart + pjj[i]; 222c6698e78SStefano Zampini #endif 2232cf14000SStefano Zampini if (sameint) { 2249566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hoffd->i, poffd->i, pA->A->rmap->n + 1)); 2252cf14000SStefano Zampini } else { 226f4f49eeaSPierre Jolivet for (i = 0; i < pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)poffd->i[i]; 2272cf14000SStefano Zampini } 2282cf14000SStefano Zampini 22906977982Sstefanozampini jj = (PetscInt *)hoffd->j; 230c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 231a333fa2bSZach Atkins PetscCallHYPRE(hypre_CSRMatrixBigInitialize(hoffd)); 232c6698e78SStefano Zampini jj = (PetscInt *)hoffd->big_j; 233c6698e78SStefano Zampini #endif 2342cf14000SStefano Zampini pjj = poffd->j; 23563c07aadSStefano Zampini for (i = 0; i < poffd->nz; i++) jj[i] = garray[pjj[i]]; 236c6698e78SStefano Zampini 237ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 23863c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 2393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24063c07aadSStefano Zampini } 24163c07aadSStefano 
Zampini 242d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat *B) 243d71ae5a4SJacob Faibussowitsch { 244f4f49eeaSPierre Jolivet Mat_HYPRE *mhA = (Mat_HYPRE *)A->data; 2452df22349SStefano Zampini Mat lA; 2462df22349SStefano Zampini ISLocalToGlobalMapping rl2g, cl2g; 2472df22349SStefano Zampini IS is; 2482df22349SStefano Zampini hypre_ParCSRMatrix *hA; 2492df22349SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 2502df22349SStefano Zampini MPI_Comm comm; 25139accc25SStefano Zampini HYPRE_Complex *hdd, *hod, *aa; 25239accc25SStefano Zampini PetscScalar *data; 2532cf14000SStefano Zampini HYPRE_BigInt *col_map_offd; 2542cf14000SStefano Zampini HYPRE_Int *hdi, *hdj, *hoi, *hoj; 2552df22349SStefano Zampini PetscInt *ii, *jj, *iptr, *jptr; 2562df22349SStefano Zampini PetscInt cum, dr, dc, oc, str, stc, nnz, i, jd, jo, M, N; 25758968eb6SStefano Zampini HYPRE_Int type; 25806977982Sstefanozampini MatType lmattype = NULL; 25906977982Sstefanozampini PetscBool freeparcsr = PETSC_FALSE; 2602df22349SStefano Zampini 2612df22349SStefano Zampini PetscFunctionBegin; 262a1787963SStefano Zampini comm = PetscObjectComm((PetscObject)A); 263a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(mhA->ij, &type)); 26408401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 265a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(mhA->ij, (void **)&hA)); 26606977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 26706977982Sstefanozampini if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(mhA->ij)) { 26806977982Sstefanozampini /* Support by copying back on the host and copy to GPU 26906977982Sstefanozampini Kind of inefficient, but this is the best we can do now */ 27006977982Sstefanozampini #if defined(HYPRE_USING_HIP) 27106977982Sstefanozampini lmattype = MATSEQAIJHIPSPARSE; 27206977982Sstefanozampini #elif defined(HYPRE_USING_CUDA) 
27306977982Sstefanozampini lmattype = MATSEQAIJCUSPARSE; 27406977982Sstefanozampini #endif 27506977982Sstefanozampini hA = hypre_ParCSRMatrixClone_v2(hA, 1, HYPRE_MEMORY_HOST); 27606977982Sstefanozampini freeparcsr = PETSC_TRUE; 27706977982Sstefanozampini } 27806977982Sstefanozampini #endif 2792df22349SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(hA); 2802df22349SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(hA); 2812df22349SStefano Zampini str = hypre_ParCSRMatrixFirstRowIndex(hA); 2822df22349SStefano Zampini stc = hypre_ParCSRMatrixFirstColDiag(hA); 2832df22349SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(hA); 2842df22349SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(hA); 2852df22349SStefano Zampini dr = hypre_CSRMatrixNumRows(hdiag); 2862df22349SStefano Zampini dc = hypre_CSRMatrixNumCols(hdiag); 2872df22349SStefano Zampini nnz = hypre_CSRMatrixNumNonzeros(hdiag); 2882df22349SStefano Zampini hdi = hypre_CSRMatrixI(hdiag); 2892df22349SStefano Zampini hdj = hypre_CSRMatrixJ(hdiag); 2902df22349SStefano Zampini hdd = hypre_CSRMatrixData(hdiag); 2912df22349SStefano Zampini oc = hypre_CSRMatrixNumCols(hoffd); 2922df22349SStefano Zampini nnz += hypre_CSRMatrixNumNonzeros(hoffd); 2932df22349SStefano Zampini hoi = hypre_CSRMatrixI(hoffd); 2942df22349SStefano Zampini hoj = hypre_CSRMatrixJ(hoffd); 2952df22349SStefano Zampini hod = hypre_CSRMatrixData(hoffd); 2962df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 2972df22349SStefano Zampini PetscInt *aux; 2982df22349SStefano Zampini 2992df22349SStefano Zampini /* generate l2g maps for rows and cols */ 3009566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, dr, str, 1, &is)); 3019566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is, &rl2g)); 3029566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 3032df22349SStefano Zampini col_map_offd = hypre_ParCSRMatrixColMapOffd(hA); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dc + oc, &aux)); 3052df22349SStefano Zampini 
for (i = 0; i < dc; i++) aux[i] = i + stc; 3062df22349SStefano Zampini for (i = 0; i < oc; i++) aux[i + dc] = col_map_offd[i]; 3079566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(comm, dc + oc, aux, PETSC_OWN_POINTER, &is)); 3089566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is, &cl2g)); 3099566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 3102df22349SStefano Zampini /* create MATIS object */ 3119566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, B)); 3129566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, dr, dc, M, N)); 3139566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATIS)); 3149566063dSJacob Faibussowitsch PetscCall(MatSetLocalToGlobalMapping(*B, rl2g, cl2g)); 3159566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&rl2g)); 3169566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&cl2g)); 3172df22349SStefano Zampini 3182df22349SStefano Zampini /* allocate CSR for local matrix */ 3199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dr + 1, &iptr)); 3209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &jptr)); 3219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &data)); 3222df22349SStefano Zampini } else { 3232df22349SStefano Zampini PetscInt nr; 3242df22349SStefano Zampini PetscBool done; 3259566063dSJacob Faibussowitsch PetscCall(MatISGetLocalMat(*B, &lA)); 3269566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(lA, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&iptr, (const PetscInt **)&jptr, &done)); 32708401ef6SPierre Jolivet PetscCheck(nr == dr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT, nr, dr); 32808401ef6SPierre Jolivet PetscCheck(iptr[nr] >= nnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in local mat! 
reuse %" PetscInt_FMT " requested %" PetscInt_FMT, iptr[nr], nnz); 32906977982Sstefanozampini PetscCall(MatSeqAIJGetArrayWrite(lA, &data)); 3302df22349SStefano Zampini } 3312df22349SStefano Zampini /* merge local matrices */ 3322df22349SStefano Zampini ii = iptr; 3332df22349SStefano Zampini jj = jptr; 33439accc25SStefano Zampini aa = (HYPRE_Complex *)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 3352df22349SStefano Zampini *ii = *(hdi++) + *(hoi++); 3362df22349SStefano Zampini for (jd = 0, jo = 0, cum = 0; *ii < nnz; cum++) { 33739accc25SStefano Zampini PetscScalar *aold = (PetscScalar *)aa; 3382df22349SStefano Zampini PetscInt *jold = jj, nc = jd + jo; 3399371c9d4SSatish Balay for (; jd < *hdi; jd++) { 3409371c9d4SSatish Balay *jj++ = *hdj++; 3419371c9d4SSatish Balay *aa++ = *hdd++; 3429371c9d4SSatish Balay } 3439371c9d4SSatish Balay for (; jo < *hoi; jo++) { 3449371c9d4SSatish Balay *jj++ = *hoj++ + dc; 3459371c9d4SSatish Balay *aa++ = *hod++; 3469371c9d4SSatish Balay } 3472df22349SStefano Zampini *(++ii) = *(hdi++) + *(hoi++); 3489566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(jd + jo - nc, jold, aold)); 3492df22349SStefano Zampini } 3502df22349SStefano Zampini for (; cum < dr; cum++) *(++ii) = nnz; 3512df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 352a033916dSStefano Zampini Mat_SeqAIJ *a; 353a033916dSStefano Zampini 3549566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF, dr, dc + oc, iptr, jptr, data, &lA)); 355a033916dSStefano Zampini /* hack SeqAIJ */ 356f4f49eeaSPierre Jolivet a = (Mat_SeqAIJ *)lA->data; 357a033916dSStefano Zampini a->free_a = PETSC_TRUE; 358a033916dSStefano Zampini a->free_ij = PETSC_TRUE; 35906977982Sstefanozampini if (lmattype) PetscCall(MatConvert(lA, lmattype, MAT_INPLACE_MATRIX, &lA)); 36006977982Sstefanozampini PetscCall(MatISSetLocalMat(*B, 
lA)); 3619566063dSJacob Faibussowitsch PetscCall(MatDestroy(&lA)); 36206977982Sstefanozampini } else { 36306977982Sstefanozampini PetscCall(MatSeqAIJRestoreArrayWrite(lA, &data)); 3642df22349SStefano Zampini } 3659566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 3669566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 36748a46eb9SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, B)); 368a333fa2bSZach Atkins if (freeparcsr) PetscCallHYPRE(hypre_ParCSRMatrixDestroy(hA)); 3693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3702df22349SStefano Zampini } 3712df22349SStefano Zampini 37206977982Sstefanozampini static PetscErrorCode MatHYPRE_DestroyCOOMat(Mat mat) 373d71ae5a4SJacob Faibussowitsch { 37406977982Sstefanozampini Mat_HYPRE *hA = (Mat_HYPRE *)mat->data; 37563c07aadSStefano Zampini 37663c07aadSStefano Zampini PetscFunctionBegin; 37706977982Sstefanozampini if (hA->cooMat) { /* If cooMat is present we need to destroy the column indices */ 37806977982Sstefanozampini PetscCall(MatDestroy(&hA->cooMat)); 37906977982Sstefanozampini if (hA->cooMatAttached) { 38006977982Sstefanozampini hypre_CSRMatrix *csr; 38106977982Sstefanozampini hypre_ParCSRMatrix *parcsr; 38206977982Sstefanozampini HYPRE_MemoryLocation mem; 38306977982Sstefanozampini 384a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr)); 38506977982Sstefanozampini csr = hypre_ParCSRMatrixDiag(parcsr); 38606977982Sstefanozampini if (csr) { 38706977982Sstefanozampini mem = hypre_CSRMatrixMemoryLocation(csr); 38806977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixJ(csr), mem)); 38906977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixBigJ(csr), mem)); 390b73e3080SStefano Zampini } 39106977982Sstefanozampini csr = hypre_ParCSRMatrixOffd(parcsr); 39206977982Sstefanozampini if (csr) { 
39306977982Sstefanozampini mem = hypre_CSRMatrixMemoryLocation(csr); 39406977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixJ(csr), mem)); 39506977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixBigJ(csr), mem)); 396b73e3080SStefano Zampini } 397b73e3080SStefano Zampini } 39806977982Sstefanozampini } 39906977982Sstefanozampini hA->cooMatAttached = PETSC_FALSE; 400b73e3080SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS); 401b73e3080SStefano Zampini } 402b73e3080SStefano Zampini 40306977982Sstefanozampini static PetscErrorCode MatHYPRE_CreateCOOMat(Mat mat) 404b73e3080SStefano Zampini { 40506977982Sstefanozampini MPI_Comm comm; 40606977982Sstefanozampini PetscMPIInt size; 40706977982Sstefanozampini PetscLayout rmap, cmap; 40806977982Sstefanozampini Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data; 40906977982Sstefanozampini MatType matType = MATAIJ; /* default type of cooMat */ 410b73e3080SStefano Zampini 411b73e3080SStefano Zampini PetscFunctionBegin; 41206977982Sstefanozampini /* Build an agent matrix cooMat with AIJ format 41306977982Sstefanozampini It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work. 
41406977982Sstefanozampini */ 41506977982Sstefanozampini PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 41606977982Sstefanozampini PetscCallMPI(MPI_Comm_size(comm, &size)); 41706977982Sstefanozampini PetscCall(PetscLayoutSetUp(mat->rmap)); 41806977982Sstefanozampini PetscCall(PetscLayoutSetUp(mat->cmap)); 41906977982Sstefanozampini PetscCall(MatGetLayouts(mat, &rmap, &cmap)); 420b73e3080SStefano Zampini 42106977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 42206977982Sstefanozampini if (!mat->boundtocpu) { /* mat will be on device, so will cooMat */ 42306977982Sstefanozampini #if defined(HYPRE_USING_HIP) 42406977982Sstefanozampini matType = MATAIJHIPSPARSE; 42506977982Sstefanozampini #elif defined(HYPRE_USING_CUDA) 42606977982Sstefanozampini matType = MATAIJCUSPARSE; 427e64794e4SJunchao Zhang #elif defined(HYPRE_USING_SYCL) && defined(PETSC_HAVE_KOKKOS_KERNELS) 428e64794e4SJunchao Zhang matType = MATAIJKOKKOS; 42906977982Sstefanozampini #else 430e64794e4SJunchao Zhang SETERRQ(comm, PETSC_ERR_SUP, "No HYPRE device available. Suggest re-installing with Kokkos Kernels"); 43106977982Sstefanozampini #endif 432b73e3080SStefano Zampini } 43306977982Sstefanozampini #endif 43406977982Sstefanozampini 43506977982Sstefanozampini /* Do COO preallocation through cooMat */ 43606977982Sstefanozampini PetscCall(MatHYPRE_DestroyCOOMat(mat)); 43706977982Sstefanozampini PetscCall(MatCreate(comm, &hmat->cooMat)); 43806977982Sstefanozampini PetscCall(MatSetType(hmat->cooMat, matType)); 43906977982Sstefanozampini PetscCall(MatSetLayouts(hmat->cooMat, rmap, cmap)); 44006977982Sstefanozampini 44106977982Sstefanozampini /* allocate local matrices if needed */ 44206977982Sstefanozampini PetscCall(MatMPIAIJSetPreallocation(hmat->cooMat, 0, NULL, 0, NULL)); 44306977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS); 44406977982Sstefanozampini } 44506977982Sstefanozampini 44606977982Sstefanozampini /* Attach cooMat data array to hypre matrix. 
44706977982Sstefanozampini When AIJCUPMSPARSE will support raw device pointers and not THRUSTARRAY 44806977982Sstefanozampini we should swap the arrays: i.e., attach hypre matrix array to cooMat 44906977982Sstefanozampini This is because hypre should be in charge of handling the memory, 45006977982Sstefanozampini cooMat is only a way to reuse PETSc COO code. 45106977982Sstefanozampini attaching the memory will then be done at MatSetValuesCOO time and it will dynamically 45206977982Sstefanozampini support hypre matrix migrating to host. 45306977982Sstefanozampini */ 45406977982Sstefanozampini static PetscErrorCode MatHYPRE_AttachCOOMat(Mat mat) 45506977982Sstefanozampini { 45606977982Sstefanozampini Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data; 45706977982Sstefanozampini hypre_CSRMatrix *diag, *offd; 45806977982Sstefanozampini hypre_ParCSRMatrix *parCSR; 45906977982Sstefanozampini HYPRE_MemoryLocation hmem = HYPRE_MEMORY_HOST; 46006977982Sstefanozampini PetscMemType pmem; 46106977982Sstefanozampini Mat A, B; 46206977982Sstefanozampini PetscScalar *a; 46306977982Sstefanozampini PetscMPIInt size; 46406977982Sstefanozampini MPI_Comm comm; 46506977982Sstefanozampini 46606977982Sstefanozampini PetscFunctionBegin; 46706977982Sstefanozampini PetscCheck(hmat->cooMat, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet"); 46806977982Sstefanozampini if (hmat->cooMatAttached) PetscFunctionReturn(PETSC_SUCCESS); 46906977982Sstefanozampini PetscCheck(hmat->cooMat->preallocated, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix is not preallocated"); 47006977982Sstefanozampini PetscCall(PetscObjectSetName((PetscObject)hmat->cooMat, "_internal_COO_mat_for_hypre")); 47106977982Sstefanozampini PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 47206977982Sstefanozampini PetscCallMPI(MPI_Comm_size(comm, &size)); 47306977982Sstefanozampini 47406977982Sstefanozampini /* Alias cooMat's data array to 
IJMatrix's */ 475a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hmat->ij, (void **)&parCSR)); 47606977982Sstefanozampini diag = hypre_ParCSRMatrixDiag(parCSR); 47706977982Sstefanozampini offd = hypre_ParCSRMatrixOffd(parCSR); 47806977982Sstefanozampini 47906977982Sstefanozampini A = (size == 1) ? hmat->cooMat : ((Mat_MPIAIJ *)hmat->cooMat->data)->A; 48006977982Sstefanozampini B = (size == 1) ? NULL : ((Mat_MPIAIJ *)hmat->cooMat->data)->B; 48106977982Sstefanozampini 48206977982Sstefanozampini PetscCall(PetscObjectSetName((PetscObject)A, "_internal_COO_mat_for_hypre")); 48306977982Sstefanozampini hmem = hypre_CSRMatrixMemoryLocation(diag); 48406977982Sstefanozampini PetscCall(MatSeqAIJGetCSRAndMemType(A, NULL, NULL, &a, &pmem)); 48506977982Sstefanozampini PetscAssert((PetscMemTypeHost(pmem) && hmem == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(pmem) && hmem == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch"); 48606977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(diag), hmem)); 48706977982Sstefanozampini hypre_CSRMatrixData(diag) = (HYPRE_Complex *)a; 48806977982Sstefanozampini hypre_CSRMatrixOwnsData(diag) = 0; /* Take ownership of (j,a) away from hypre. 
As a result, we need to free them on our own */ 48906977982Sstefanozampini 49006977982Sstefanozampini if (B) { 49106977982Sstefanozampini hmem = hypre_CSRMatrixMemoryLocation(offd); 49206977982Sstefanozampini PetscCall(MatSeqAIJGetCSRAndMemType(B, NULL, NULL, &a, &pmem)); 49306977982Sstefanozampini PetscAssert((PetscMemTypeHost(pmem) && hmem == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(pmem) && hmem == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch"); 49406977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(offd), hmem)); 49506977982Sstefanozampini hypre_CSRMatrixData(offd) = (HYPRE_Complex *)a; 49606977982Sstefanozampini hypre_CSRMatrixOwnsData(offd) = 0; 49706977982Sstefanozampini } 49806977982Sstefanozampini hmat->cooMatAttached = PETSC_TRUE; 49906977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS); 50006977982Sstefanozampini } 50106977982Sstefanozampini 5021c265611SJunchao Zhang // Build COO's coordinate list i[], j[] based on CSR's i[], j[] arrays and the number of local rows 'n' 50306977982Sstefanozampini static PetscErrorCode CSRtoCOO_Private(PetscInt n, const PetscInt ii[], const PetscInt jj[], PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j) 50406977982Sstefanozampini { 50506977982Sstefanozampini PetscInt *cooi, *cooj; 50606977982Sstefanozampini 50706977982Sstefanozampini PetscFunctionBegin; 50806977982Sstefanozampini *ncoo = ii[n]; 50906977982Sstefanozampini PetscCall(PetscMalloc2(*ncoo, &cooi, *ncoo, &cooj)); 51006977982Sstefanozampini for (PetscInt i = 0; i < n; i++) { 51106977982Sstefanozampini for (PetscInt j = ii[i]; j < ii[i + 1]; j++) cooi[j] = i; 51206977982Sstefanozampini } 51306977982Sstefanozampini PetscCall(PetscArraycpy(cooj, jj, *ncoo)); 51406977982Sstefanozampini *coo_i = cooi; 51506977982Sstefanozampini *coo_j = cooj; 51606977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS); 51706977982Sstefanozampini } 51806977982Sstefanozampini 
5191c265611SJunchao Zhang // Similar to CSRtoCOO_Private, but the CSR's i[], j[] are of type HYPRE_Int 52006977982Sstefanozampini static PetscErrorCode CSRtoCOO_HYPRE_Int_Private(PetscInt n, const HYPRE_Int ii[], const HYPRE_Int jj[], PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j) 52106977982Sstefanozampini { 52206977982Sstefanozampini PetscInt *cooi, *cooj; 52306977982Sstefanozampini 52406977982Sstefanozampini PetscFunctionBegin; 52506977982Sstefanozampini *ncoo = ii[n]; 52606977982Sstefanozampini PetscCall(PetscMalloc2(*ncoo, &cooi, *ncoo, &cooj)); 52706977982Sstefanozampini for (PetscInt i = 0; i < n; i++) { 52806977982Sstefanozampini for (HYPRE_Int j = ii[i]; j < ii[i + 1]; j++) cooi[j] = i; 52906977982Sstefanozampini } 53006977982Sstefanozampini for (PetscCount i = 0; i < *ncoo; i++) cooj[i] = jj[i]; 53106977982Sstefanozampini *coo_i = cooi; 53206977982Sstefanozampini *coo_j = cooj; 53306977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS); 53406977982Sstefanozampini } 53506977982Sstefanozampini 5361c265611SJunchao Zhang // Build a COO data structure for the seqaij matrix, as if the nonzeros are laid out in the same order as in the CSR 53706977982Sstefanozampini static PetscErrorCode MatSeqAIJGetCOO_Private(Mat A, PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j) 53806977982Sstefanozampini { 53906977982Sstefanozampini PetscInt n; 54006977982Sstefanozampini const PetscInt *ii, *jj; 54106977982Sstefanozampini PetscBool done; 54206977982Sstefanozampini 54306977982Sstefanozampini PetscFunctionBegin; 54406977982Sstefanozampini PetscCall(MatGetRowIJ(A, 0, PETSC_FALSE, PETSC_FALSE, &n, &ii, &jj, &done)); 54506977982Sstefanozampini PetscCheck(done, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Failure for MatGetRowIJ"); 54606977982Sstefanozampini PetscCall(CSRtoCOO_Private(n, ii, jj, ncoo, coo_i, coo_j)); 54706977982Sstefanozampini PetscCall(MatRestoreRowIJ(A, 0, PETSC_FALSE, PETSC_FALSE, &n, &ii, &jj, &done)); 54806977982Sstefanozampini 
PetscCheck(done, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Failure for MatRestoreRowIJ"); 54906977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS); 55006977982Sstefanozampini } 55106977982Sstefanozampini 5521c265611SJunchao Zhang // Build a COO data structure for the hypreCSRMatrix, as if the nonzeros are laid out in the same order as in the hypreCSRMatrix 55306977982Sstefanozampini static PetscErrorCode hypreCSRMatrixGetCOO_Private(hypre_CSRMatrix *A, PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j) 55406977982Sstefanozampini { 55506977982Sstefanozampini PetscInt n = hypre_CSRMatrixNumRows(A); 55606977982Sstefanozampini HYPRE_Int *ii, *jj; 55706977982Sstefanozampini HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST; 55806977982Sstefanozampini 55906977982Sstefanozampini PetscFunctionBegin; 56006977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 56106977982Sstefanozampini mem = hypre_CSRMatrixMemoryLocation(A); 56206977982Sstefanozampini if (mem != HYPRE_MEMORY_HOST) { 56306977982Sstefanozampini PetscCount nnz = hypre_CSRMatrixNumNonzeros(A); 56406977982Sstefanozampini PetscCall(PetscMalloc2(n + 1, &ii, nnz, &jj)); 56506977982Sstefanozampini hypre_TMemcpy(ii, hypre_CSRMatrixI(A), HYPRE_Int, n + 1, HYPRE_MEMORY_HOST, mem); 56606977982Sstefanozampini hypre_TMemcpy(jj, hypre_CSRMatrixJ(A), HYPRE_Int, nnz, HYPRE_MEMORY_HOST, mem); 56706977982Sstefanozampini } else { 56806977982Sstefanozampini #else 56906977982Sstefanozampini { 57006977982Sstefanozampini #endif 57106977982Sstefanozampini ii = hypre_CSRMatrixI(A); 57206977982Sstefanozampini jj = hypre_CSRMatrixJ(A); 57306977982Sstefanozampini } 57406977982Sstefanozampini PetscCall(CSRtoCOO_HYPRE_Int_Private(n, ii, jj, ncoo, coo_i, coo_j)); 57506977982Sstefanozampini if (mem != HYPRE_MEMORY_HOST) PetscCall(PetscFree2(ii, jj)); 57606977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS); 57706977982Sstefanozampini } 57806977982Sstefanozampini 57906977982Sstefanozampini static PetscErrorCode 
MatSetValuesCOOFromCSRMatrix_Private(Mat A, hypre_CSRMatrix *H) 58006977982Sstefanozampini { 58106977982Sstefanozampini PetscBool iscpu = PETSC_TRUE; 58206977982Sstefanozampini PetscScalar *a; 58306977982Sstefanozampini HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST; 58406977982Sstefanozampini 58506977982Sstefanozampini PetscFunctionBegin; 58606977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 58706977982Sstefanozampini mem = hypre_CSRMatrixMemoryLocation(H); 58806977982Sstefanozampini PetscCall(PetscObjectTypeCompare((PetscObject)A, MATSEQAIJ, &iscpu)); 58906977982Sstefanozampini #endif 59006977982Sstefanozampini if (iscpu && mem != HYPRE_MEMORY_HOST) { 59106977982Sstefanozampini PetscCount nnz = hypre_CSRMatrixNumNonzeros(H); 59206977982Sstefanozampini PetscCall(PetscMalloc1(nnz, &a)); 59306977982Sstefanozampini hypre_TMemcpy(a, hypre_CSRMatrixData(H), PetscScalar, nnz, HYPRE_MEMORY_HOST, mem); 59406977982Sstefanozampini } else { 59506977982Sstefanozampini a = (PetscScalar *)hypre_CSRMatrixData(H); 59606977982Sstefanozampini } 59706977982Sstefanozampini PetscCall(MatSetValuesCOO(A, a, INSERT_VALUES)); 59806977982Sstefanozampini if (iscpu && mem != HYPRE_MEMORY_HOST) PetscCall(PetscFree(a)); 599b73e3080SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS); 600b73e3080SStefano Zampini } 601b73e3080SStefano Zampini 602b73e3080SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B) 603b73e3080SStefano Zampini { 604b73e3080SStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 60506977982Sstefanozampini Mat M = NULL, dH = NULL, oH = NULL, dA = NULL, oA = NULL; 606d7185485SAlex Lindsay PetscBool ismpiaij, issbaij, isbaij, boundtocpu = PETSC_TRUE; 607b73e3080SStefano Zampini Mat_HYPRE *hA; 608d7185485SAlex Lindsay PetscMemType memtype = PETSC_MEMTYPE_HOST; 609b73e3080SStefano Zampini 610b73e3080SStefano Zampini PetscFunctionBegin; 611d7185485SAlex Lindsay if (PetscDefined(HAVE_HYPRE_DEVICE)) { 
612d7185485SAlex Lindsay PetscCall(MatGetCurrentMemType(A, &memtype)); 613d7185485SAlex Lindsay PetscHYPREInitialize(); 614d7185485SAlex Lindsay boundtocpu = PetscMemTypeHost(memtype) ? PETSC_TRUE : PETSC_FALSE; 615a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_SetMemoryLocation(boundtocpu ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE)); 616d7185485SAlex Lindsay } 617d7185485SAlex Lindsay 618b73e3080SStefano Zampini PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &issbaij, MATSEQSBAIJ, MATMPIBAIJ, "")); 619b73e3080SStefano Zampini PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &isbaij, MATSEQBAIJ, MATMPIBAIJ, "")); 620b73e3080SStefano Zampini if (isbaij || issbaij) { /* handle BAIJ and SBAIJ */ 621b73e3080SStefano Zampini PetscBool ismpi; 622b73e3080SStefano Zampini MatType newtype; 623b73e3080SStefano Zampini 624b73e3080SStefano Zampini PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &ismpi, MATMPISBAIJ, MATMPIBAIJ, "")); 625b73e3080SStefano Zampini newtype = ismpi ? MATMPIAIJ : MATSEQAIJ; 62663c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 627b73e3080SStefano Zampini PetscCall(MatConvert(*B, newtype, MAT_INPLACE_MATRIX, B)); 628b73e3080SStefano Zampini PetscCall(MatConvert(A, newtype, MAT_REUSE_MATRIX, B)); 629b73e3080SStefano Zampini PetscCall(MatConvert(*B, MATHYPRE, MAT_INPLACE_MATRIX, B)); 630b73e3080SStefano Zampini } else if (reuse == MAT_INITIAL_MATRIX) { 631b73e3080SStefano Zampini PetscCall(MatConvert(A, newtype, MAT_INITIAL_MATRIX, B)); 632b73e3080SStefano Zampini PetscCall(MatConvert(*B, MATHYPRE, MAT_INPLACE_MATRIX, B)); 63363c07aadSStefano Zampini } else { 634b73e3080SStefano Zampini PetscCall(MatConvert(A, newtype, MAT_INPLACE_MATRIX, &A)); 635b73e3080SStefano Zampini PetscCall(MatConvert(A, MATHYPRE, MAT_INPLACE_MATRIX, &A)); 636b73e3080SStefano Zampini } 637d7185485SAlex Lindsay #if defined(PETSC_HAVE_DEVICE) 638d7185485SAlex Lindsay (*B)->boundtocpu = boundtocpu; 639d7185485SAlex Lindsay #endif 640b73e3080SStefano Zampini 
PetscFunctionReturn(PETSC_SUCCESS); 641b73e3080SStefano Zampini } 64206977982Sstefanozampini 64306977982Sstefanozampini dA = A; 644b73e3080SStefano Zampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij)); 645b73e3080SStefano Zampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(A, &dA, &oA, NULL)); 64606977982Sstefanozampini 647b73e3080SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 64806977982Sstefanozampini PetscCount coo_n; 64906977982Sstefanozampini PetscInt *coo_i, *coo_j; 65006977982Sstefanozampini 6519566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &M)); 6529566063dSJacob Faibussowitsch PetscCall(MatSetType(M, MATHYPRE)); 6539566063dSJacob Faibussowitsch PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N)); 654b73e3080SStefano Zampini PetscCall(MatSetOption(M, MAT_SORTED_FULL, PETSC_TRUE)); 655b73e3080SStefano Zampini PetscCall(MatSetOption(M, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 656b73e3080SStefano Zampini 657b73e3080SStefano Zampini hA = (Mat_HYPRE *)M->data; 65806977982Sstefanozampini PetscCall(MatHYPRE_CreateFromMat(A, hA)); 65906977982Sstefanozampini PetscCall(MatHYPRE_IJMatrixCopyIJ(A, hA->ij)); 66006977982Sstefanozampini 66106977982Sstefanozampini PetscCall(MatHYPRE_CreateCOOMat(M)); 66206977982Sstefanozampini 66306977982Sstefanozampini dH = hA->cooMat; 66406977982Sstefanozampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)hA->cooMat, MATMPIAIJ, &ismpiaij)); 66506977982Sstefanozampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(hA->cooMat, &dH, &oH, NULL)); 66606977982Sstefanozampini 66706977982Sstefanozampini PetscCall(PetscObjectSetName((PetscObject)dH, "_internal_COO_mat_for_hypre")); 66806977982Sstefanozampini PetscCall(MatSeqAIJGetCOO_Private(dA, &coo_n, &coo_i, &coo_j)); 66906977982Sstefanozampini PetscCall(MatSetPreallocationCOO(dH, coo_n, coo_i, coo_j)); 67006977982Sstefanozampini PetscCall(PetscFree2(coo_i, coo_j)); 67106977982Sstefanozampini if (oH) { 67206977982Sstefanozampini 
PetscCall(PetscLayoutDestroy(&oH->cmap)); 67306977982Sstefanozampini PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)oH), oA->cmap->n, oA->cmap->n, 1, &oH->cmap)); 67406977982Sstefanozampini PetscCall(MatSeqAIJGetCOO_Private(oA, &coo_n, &coo_i, &coo_j)); 67506977982Sstefanozampini PetscCall(MatSetPreallocationCOO(oH, coo_n, coo_i, coo_j)); 67606977982Sstefanozampini PetscCall(PetscFree2(coo_i, coo_j)); 67706977982Sstefanozampini } 67806977982Sstefanozampini hA->cooMat->assembled = PETSC_TRUE; 67906977982Sstefanozampini 680b73e3080SStefano Zampini M->preallocated = PETSC_TRUE; 68106977982Sstefanozampini PetscCall(MatAssemblyBegin(M, MAT_FINAL_ASSEMBLY)); 68206977982Sstefanozampini PetscCall(MatAssemblyEnd(M, MAT_FINAL_ASSEMBLY)); 68306977982Sstefanozampini 68406977982Sstefanozampini PetscCall(MatHYPRE_AttachCOOMat(M)); 68584d4e069SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) *B = M; 686b73e3080SStefano Zampini } else M = *B; 687b73e3080SStefano Zampini 688b73e3080SStefano Zampini hA = (Mat_HYPRE *)M->data; 68906977982Sstefanozampini PetscCheck(hA->cooMat, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet"); 69006977982Sstefanozampini 69106977982Sstefanozampini dH = hA->cooMat; 69206977982Sstefanozampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)hA->cooMat, MATMPIAIJ, &ismpiaij)); 69306977982Sstefanozampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(hA->cooMat, &dH, &oH, NULL)); 69406977982Sstefanozampini 69506977982Sstefanozampini PetscScalar *a; 69606977982Sstefanozampini PetscCall(MatSeqAIJGetCSRAndMemType(dA, NULL, NULL, &a, NULL)); 69706977982Sstefanozampini PetscCall(MatSetValuesCOO(dH, a, INSERT_VALUES)); 69806977982Sstefanozampini if (oH) { 69906977982Sstefanozampini PetscCall(MatSeqAIJGetCSRAndMemType(oA, NULL, NULL, &a, NULL)); 70006977982Sstefanozampini PetscCall(MatSetValuesCOO(oH, a, INSERT_VALUES)); 70106977982Sstefanozampini } 702b73e3080SStefano Zampini 70348a46eb9SPierre 
Jolivet if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M)); 704d7185485SAlex Lindsay #if defined(PETSC_HAVE_DEVICE) 705d7185485SAlex Lindsay (*B)->boundtocpu = boundtocpu; 706d7185485SAlex Lindsay #endif 7073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 70863c07aadSStefano Zampini } 70963c07aadSStefano Zampini 710d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B) 711d71ae5a4SJacob Faibussowitsch { 71206977982Sstefanozampini Mat M, dA = NULL, oA = NULL; 71363c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 71406977982Sstefanozampini hypre_CSRMatrix *dH, *oH; 71563c07aadSStefano Zampini MPI_Comm comm; 71606977982Sstefanozampini PetscBool ismpiaij, isseqaij; 71763c07aadSStefano Zampini 71863c07aadSStefano Zampini PetscFunctionBegin; 71963c07aadSStefano Zampini comm = PetscObjectComm((PetscObject)A); 72063c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 7219566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATMPIAIJ, &ismpiaij)); 7229566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATSEQAIJ, &isseqaij)); 72306977982Sstefanozampini PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Only MATMPIAIJ or MATSEQAIJ base types are supported"); 72463c07aadSStefano Zampini } 72506977982Sstefanozampini PetscCall(MatHYPREGetParCSR(A, &parcsr)); 7266ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 72706977982Sstefanozampini if (HYPRE_MEMORY_DEVICE == hypre_ParCSRMatrixMemoryLocation(parcsr)) { 72806977982Sstefanozampini PetscBool isaij; 72906977982Sstefanozampini 73006977982Sstefanozampini PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij)); 73106977982Sstefanozampini if (isaij) { 73206977982Sstefanozampini PetscMPIInt size; 73306977982Sstefanozampini 7349566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 73506977982Sstefanozampini #if defined(HYPRE_USING_HIP) 
73606977982Sstefanozampini mtype = size > 1 ? MATMPIAIJHIPSPARSE : MATSEQAIJHIPSPARSE; 73706977982Sstefanozampini #elif defined(HYPRE_USING_CUDA) 73806977982Sstefanozampini mtype = size > 1 ? MATMPIAIJCUSPARSE : MATSEQAIJCUSPARSE; 73906977982Sstefanozampini #else 74006977982Sstefanozampini mtype = size > 1 ? MATMPIAIJ : MATSEQAIJ; 74106977982Sstefanozampini #endif 74263c07aadSStefano Zampini } 74363c07aadSStefano Zampini } 74406977982Sstefanozampini #endif 74506977982Sstefanozampini dH = hypre_ParCSRMatrixDiag(parcsr); 74606977982Sstefanozampini oH = hypre_ParCSRMatrixOffd(parcsr); 7479371c9d4SSatish Balay if (reuse != MAT_REUSE_MATRIX) { 74806977982Sstefanozampini PetscCount coo_n; 74906977982Sstefanozampini PetscInt *coo_i, *coo_j; 75063c07aadSStefano Zampini 75106977982Sstefanozampini PetscCall(MatCreate(comm, &M)); 75206977982Sstefanozampini PetscCall(MatSetType(M, mtype)); 75306977982Sstefanozampini PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N)); 75406977982Sstefanozampini PetscCall(MatMPIAIJSetPreallocation(M, 0, NULL, 0, NULL)); 75563c07aadSStefano Zampini 75606977982Sstefanozampini dA = M; 75706977982Sstefanozampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)M, MATMPIAIJ, &ismpiaij)); 75806977982Sstefanozampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(M, &dA, &oA, NULL)); 759a16187a7SStefano Zampini 76006977982Sstefanozampini PetscCall(hypreCSRMatrixGetCOO_Private(dH, &coo_n, &coo_i, &coo_j)); 76106977982Sstefanozampini PetscCall(MatSetPreallocationCOO(dA, coo_n, coo_i, coo_j)); 76206977982Sstefanozampini PetscCall(PetscFree2(coo_i, coo_j)); 76306977982Sstefanozampini if (ismpiaij) { 76406977982Sstefanozampini HYPRE_Int nc = hypre_CSRMatrixNumCols(oH); 765a16187a7SStefano Zampini 76606977982Sstefanozampini PetscCall(PetscLayoutDestroy(&oA->cmap)); 76706977982Sstefanozampini PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)oA), nc, nc, 1, &oA->cmap)); 76806977982Sstefanozampini 
PetscCall(hypreCSRMatrixGetCOO_Private(oH, &coo_n, &coo_i, &coo_j)); 76906977982Sstefanozampini PetscCall(MatSetPreallocationCOO(oA, coo_n, coo_i, coo_j)); 77006977982Sstefanozampini PetscCall(PetscFree2(coo_i, coo_j)); 771a16187a7SStefano Zampini 77206977982Sstefanozampini /* garray */ 773f4f49eeaSPierre Jolivet Mat_MPIAIJ *aij = (Mat_MPIAIJ *)M->data; 77406977982Sstefanozampini HYPRE_BigInt *harray = hypre_ParCSRMatrixColMapOffd(parcsr); 77506977982Sstefanozampini PetscInt *garray; 77606977982Sstefanozampini 77706977982Sstefanozampini PetscCall(PetscFree(aij->garray)); 77806977982Sstefanozampini PetscCall(PetscMalloc1(nc, &garray)); 77906977982Sstefanozampini for (HYPRE_Int i = 0; i < nc; i++) garray[i] = (PetscInt)harray[i]; 78006977982Sstefanozampini aij->garray = garray; 78106977982Sstefanozampini PetscCall(MatSetUpMultiply_MPIAIJ(M)); 782a16187a7SStefano Zampini } 78306977982Sstefanozampini if (reuse == MAT_INITIAL_MATRIX) *B = M; 78406977982Sstefanozampini } else M = *B; 785225daaf8SStefano Zampini 78606977982Sstefanozampini dA = M; 78706977982Sstefanozampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)M, MATMPIAIJ, &ismpiaij)); 78806977982Sstefanozampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(M, &dA, &oA, NULL)); 78906977982Sstefanozampini PetscCall(MatSetValuesCOOFromCSRMatrix_Private(dA, dH)); 79006977982Sstefanozampini if (oA) PetscCall(MatSetValuesCOOFromCSRMatrix_Private(oA, oH)); 79106977982Sstefanozampini M->assembled = PETSC_TRUE; 79206977982Sstefanozampini if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M)); 7933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 79463c07aadSStefano Zampini } 79563c07aadSStefano Zampini 796d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 797d71ae5a4SJacob Faibussowitsch { 798613e5ff0Sstefano_zampini hypre_ParCSRMatrix *tA; 799c1a070e6SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 800c1a070e6SStefano Zampini 
Mat_SeqAIJ *diag, *offd; 8012cf14000SStefano Zampini PetscInt *garray, i, noffd, dnnz, onnz, *row_starts, *col_starts; 802c1a070e6SStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 803613e5ff0Sstefano_zampini PetscBool ismpiaij, isseqaij; 8042cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 8056ea7df73SStefano Zampini HYPRE_Int *hdi = NULL, *hdj = NULL, *hoi = NULL, *hoj = NULL; 8065c97c10fSStefano Zampini PetscInt *pdi = NULL, *pdj = NULL, *poi = NULL, *poj = NULL; 80706977982Sstefanozampini PetscBool iscuda, iship; 80806977982Sstefanozampini #if defined(PETSC_HAVE_DEVICE) && defined(PETSC_HAVE_HYPRE_DEVICE) 80906977982Sstefanozampini PetscBool boundtocpu = A->boundtocpu; 81006977982Sstefanozampini #else 81106977982Sstefanozampini PetscBool boundtocpu = PETSC_TRUE; 8126ea7df73SStefano Zampini #endif 813c1a070e6SStefano Zampini 814c1a070e6SStefano Zampini PetscFunctionBegin; 8159566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij)); 8169566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &isseqaij)); 81708401ef6SPierre Jolivet PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Unsupported type %s", ((PetscObject)A)->type_name); 818b655ebf8SZach Atkins PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, "")); 819b655ebf8SZach Atkins PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iship, MATSEQAIJHIPSPARSE, MATMPIAIJHIPSPARSE, "")); 820ea9ee2c1SPierre Jolivet PetscHYPREInitialize(); 821c1a070e6SStefano Zampini if (ismpiaij) { 822f4f49eeaSPierre Jolivet Mat_MPIAIJ *a = (Mat_MPIAIJ *)A->data; 823c1a070e6SStefano Zampini 824c1a070e6SStefano Zampini diag = (Mat_SeqAIJ *)a->A->data; 825c1a070e6SStefano Zampini offd = (Mat_SeqAIJ *)a->B->data; 82606977982Sstefanozampini if (!boundtocpu && (iscuda || iship)) { 82706977982Sstefanozampini #if defined(HYPRE_USING_CUDA) 
&& defined(PETSC_HAVE_CUDA) 82806977982Sstefanozampini if (iscuda) { 8296ea7df73SStefano Zampini sameint = PETSC_TRUE; 8309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj)); 8319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj)); 83206977982Sstefanozampini } 8336ea7df73SStefano Zampini #endif 83406977982Sstefanozampini #if defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP) 83506977982Sstefanozampini if (iship) { 83606977982Sstefanozampini sameint = PETSC_TRUE; 83706977982Sstefanozampini PetscCall(MatSeqAIJHIPSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj)); 83806977982Sstefanozampini PetscCall(MatSeqAIJHIPSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj)); 83906977982Sstefanozampini } 84006977982Sstefanozampini #endif 84106977982Sstefanozampini } else { 84206977982Sstefanozampini boundtocpu = PETSC_TRUE; 8436ea7df73SStefano Zampini pdi = diag->i; 8446ea7df73SStefano Zampini pdj = diag->j; 8456ea7df73SStefano Zampini poi = offd->i; 8466ea7df73SStefano Zampini poj = offd->j; 8476ea7df73SStefano Zampini if (sameint) { 8486ea7df73SStefano Zampini hdi = (HYPRE_Int *)pdi; 8496ea7df73SStefano Zampini hdj = (HYPRE_Int *)pdj; 8506ea7df73SStefano Zampini hoi = (HYPRE_Int *)poi; 8516ea7df73SStefano Zampini hoj = (HYPRE_Int *)poj; 8526ea7df73SStefano Zampini } 8536ea7df73SStefano Zampini } 854c1a070e6SStefano Zampini garray = a->garray; 855c1a070e6SStefano Zampini noffd = a->B->cmap->N; 856c1a070e6SStefano Zampini dnnz = diag->nz; 857c1a070e6SStefano Zampini onnz = offd->nz; 858c1a070e6SStefano Zampini } else { 859c1a070e6SStefano Zampini diag = (Mat_SeqAIJ *)A->data; 860c1a070e6SStefano Zampini offd = NULL; 86106977982Sstefanozampini if (!boundtocpu && (iscuda || iship)) { 86206977982Sstefanozampini #if defined(HYPRE_USING_CUDA) && 
defined(PETSC_HAVE_CUDA) 86306977982Sstefanozampini if (iscuda) { 8646ea7df73SStefano Zampini sameint = PETSC_TRUE; 8659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj)); 86606977982Sstefanozampini } 8676ea7df73SStefano Zampini #endif 86806977982Sstefanozampini #if defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP) 86906977982Sstefanozampini if (iship) { 87006977982Sstefanozampini sameint = PETSC_TRUE; 87106977982Sstefanozampini PetscCall(MatSeqAIJHIPSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj)); 87206977982Sstefanozampini } 87306977982Sstefanozampini #endif 87406977982Sstefanozampini } else { 87506977982Sstefanozampini boundtocpu = PETSC_TRUE; 8766ea7df73SStefano Zampini pdi = diag->i; 8776ea7df73SStefano Zampini pdj = diag->j; 8786ea7df73SStefano Zampini if (sameint) { 8796ea7df73SStefano Zampini hdi = (HYPRE_Int *)pdi; 8806ea7df73SStefano Zampini hdj = (HYPRE_Int *)pdj; 8816ea7df73SStefano Zampini } 8826ea7df73SStefano Zampini } 883c1a070e6SStefano Zampini garray = NULL; 884c1a070e6SStefano Zampini noffd = 0; 885c1a070e6SStefano Zampini dnnz = diag->nz; 886c1a070e6SStefano Zampini onnz = 0; 887c1a070e6SStefano Zampini } 888225daaf8SStefano Zampini 889c1a070e6SStefano Zampini /* create a temporary ParCSR */ 890c1a070e6SStefano Zampini if (HYPRE_AssumedPartitionCheck()) { 891c1a070e6SStefano Zampini PetscMPIInt myid; 892c1a070e6SStefano Zampini 8939566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &myid)); 894c1a070e6SStefano Zampini row_starts = A->rmap->range + myid; 895c1a070e6SStefano Zampini col_starts = A->cmap->range + myid; 896c1a070e6SStefano Zampini } else { 897c1a070e6SStefano Zampini row_starts = A->rmap->range; 898c1a070e6SStefano Zampini col_starts = A->cmap->range; 899c1a070e6SStefano Zampini } 900*f2f41e48SZach Atkins tA = hypre_ParCSRMatrixCreate(comm, A->rmap->N, A->cmap->N, (HYPRE_BigInt *)row_starts, (HYPRE_BigInt 
*)col_starts, (HYPRE_Int)noffd, (HYPRE_Int)dnnz, (HYPRE_Int)onnz); 901a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 902c1a070e6SStefano Zampini hypre_ParCSRMatrixSetRowStartsOwner(tA, 0); 903c1a070e6SStefano Zampini hypre_ParCSRMatrixSetColStartsOwner(tA, 0); 904a1d2239cSSatish Balay #endif 905c1a070e6SStefano Zampini 906225daaf8SStefano Zampini /* set diagonal part */ 907c1a070e6SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(tA); 9086ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 9099566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n + 1, &hdi, dnnz, &hdj)); 910f4f49eeaSPierre Jolivet for (i = 0; i < A->rmap->n + 1; i++) hdi[i] = (HYPRE_Int)pdi[i]; 911f4f49eeaSPierre Jolivet for (i = 0; i < dnnz; i++) hdj[i] = (HYPRE_Int)pdj[i]; 9122cf14000SStefano Zampini } 9136ea7df73SStefano Zampini hypre_CSRMatrixI(hdiag) = hdi; 9146ea7df73SStefano Zampini hypre_CSRMatrixJ(hdiag) = hdj; 91539accc25SStefano Zampini hypre_CSRMatrixData(hdiag) = (HYPRE_Complex *)diag->a; 916*f2f41e48SZach Atkins hypre_CSRMatrixNumNonzeros(hdiag) = (HYPRE_Int)diag->nz; 917c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hdiag, 0); 918c1a070e6SStefano Zampini 9194cf0e950SBarry Smith /* set off-diagonal part */ 920c1a070e6SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(tA); 921c1a070e6SStefano Zampini if (offd) { 9226ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 9239566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n + 1, &hoi, onnz, &hoj)); 924f4f49eeaSPierre Jolivet for (i = 0; i < A->rmap->n + 1; i++) hoi[i] = (HYPRE_Int)poi[i]; 925f4f49eeaSPierre Jolivet for (i = 0; i < onnz; i++) hoj[i] = (HYPRE_Int)poj[i]; 9262cf14000SStefano Zampini } 9276ea7df73SStefano Zampini hypre_CSRMatrixI(hoffd) = hoi; 9286ea7df73SStefano Zampini hypre_CSRMatrixJ(hoffd) = hoj; 92939accc25SStefano Zampini hypre_CSRMatrixData(hoffd) = (HYPRE_Complex *)offd->a; 930*f2f41e48SZach Atkins hypre_CSRMatrixNumNonzeros(hoffd) = 
(HYPRE_Int)offd->nz; 931c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hoffd, 0); 9326ea7df73SStefano Zampini } 9336ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 934a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixInitialize_v2(tA, !boundtocpu ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST)); 9356ea7df73SStefano Zampini #else 9366ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 937a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixInitialize(tA)); 9386ea7df73SStefano Zampini #else 939a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixInitialize_v2(tA, HYPRE_MEMORY_HOST)); 9406ea7df73SStefano Zampini #endif 9416ea7df73SStefano Zampini #endif 942bb16242fSVictor A. P. Magri 943bb16242fSVictor A. P. Magri /* MatrixSetRownnz comes after MatrixInitialize, so the first uses the right memory location */ 944bb16242fSVictor A. P. Magri hypre_CSRMatrixSetRownnz(hdiag); 945bb16242fSVictor A. P. Magri if (offd) hypre_CSRMatrixSetRownnz(hoffd); 946bb16242fSVictor A. P. 
Magri 9476ea7df73SStefano Zampini hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA), HYPRE_MEMORY_HOST); 948c1a070e6SStefano Zampini hypre_ParCSRMatrixSetNumNonzeros(tA); 9492cf14000SStefano Zampini hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt *)garray; 950a333fa2bSZach Atkins if (!hypre_ParCSRMatrixCommPkg(tA)) PetscCallHYPRE(hypre_MatvecCommPkgCreate(tA)); 951613e5ff0Sstefano_zampini *hA = tA; 9523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 953613e5ff0Sstefano_zampini } 954c1a070e6SStefano Zampini 955d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 956d71ae5a4SJacob Faibussowitsch { 957613e5ff0Sstefano_zampini hypre_CSRMatrix *hdiag, *hoffd; 9586ea7df73SStefano Zampini PetscBool ismpiaij, sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 959b655ebf8SZach Atkins PetscBool iscuda, iship; 960c1a070e6SStefano Zampini 961613e5ff0Sstefano_zampini PetscFunctionBegin; 9629566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij)); 9639566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, "")); 964b655ebf8SZach Atkins PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iship, MATSEQAIJHIPSPARSE, MATMPIAIJHIPSPARSE, "")); 965b655ebf8SZach Atkins #if defined(HYPRE_USING_CUDA) && defined(PETSC_HAVE_CUDA) 9666ea7df73SStefano Zampini if (iscuda) sameint = PETSC_TRUE; 967b655ebf8SZach Atkins #elif defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP) 968b655ebf8SZach Atkins if (iship) sameint = PETSC_TRUE; 9696ea7df73SStefano Zampini #endif 970613e5ff0Sstefano_zampini hdiag = hypre_ParCSRMatrixDiag(*hA); 971613e5ff0Sstefano_zampini hoffd = hypre_ParCSRMatrixOffd(*hA); 9726ea7df73SStefano Zampini /* free temporary memory allocated by PETSc 9736ea7df73SStefano Zampini set pointers to NULL before destroying tA */ 9742cf14000SStefano Zampini if (!sameint) { 
9752cf14000SStefano Zampini HYPRE_Int *hi, *hj; 9762cf14000SStefano Zampini 9772cf14000SStefano Zampini hi = hypre_CSRMatrixI(hdiag); 9782cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hdiag); 9799566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi, hj)); 9806ea7df73SStefano Zampini if (ismpiaij) { 9812cf14000SStefano Zampini hi = hypre_CSRMatrixI(hoffd); 9822cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hoffd); 9839566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi, hj)); 9842cf14000SStefano Zampini } 9852cf14000SStefano Zampini } 986c1a070e6SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 987c1a070e6SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 988c1a070e6SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 9896ea7df73SStefano Zampini if (ismpiaij) { 990c1a070e6SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 991c1a070e6SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 992c1a070e6SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 9936ea7df73SStefano Zampini } 994613e5ff0Sstefano_zampini hypre_ParCSRMatrixColMapOffd(*hA) = NULL; 995613e5ff0Sstefano_zampini hypre_ParCSRMatrixDestroy(*hA); 996613e5ff0Sstefano_zampini *hA = NULL; 9973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 998613e5ff0Sstefano_zampini } 999613e5ff0Sstefano_zampini 1000613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG: 10013dad0653Sstefano_zampini the resulting ParCSR will not own the column and row starts 10026ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 1003d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP) 1004d71ae5a4SJacob Faibussowitsch { 1005a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 1006613e5ff0Sstefano_zampini HYPRE_Int P_owns_col_starts, R_owns_row_starts; 1007a1d2239cSSatish Balay #endif 1008613e5ff0Sstefano_zampini 1009613e5ff0Sstefano_zampini PetscFunctionBegin; 
1010a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 1011613e5ff0Sstefano_zampini P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP); 1012613e5ff0Sstefano_zampini R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR); 1013a1d2239cSSatish Balay #endif 10146ea7df73SStefano Zampini /* can be replaced by version test later */ 10156ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 1016792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatrixRAP"); 10176ea7df73SStefano Zampini *hRAP = hypre_ParCSRMatrixRAP(hR, hA, hP); 10186ea7df73SStefano Zampini PetscStackPop; 10196ea7df73SStefano Zampini #else 1020a333fa2bSZach Atkins PetscCallHYPRE(hypre_BoomerAMGBuildCoarseOperator(hR, hA, hP, hRAP)); 1021a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixSetNumNonzeros(*hRAP)); 10226ea7df73SStefano Zampini #endif 1023613e5ff0Sstefano_zampini /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */ 1024a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 1025613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetRowStartsOwner(*hRAP, 0); 1026613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetColStartsOwner(*hRAP, 0); 1027613e5ff0Sstefano_zampini if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP, 1); 1028613e5ff0Sstefano_zampini if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR, 1); 1029a1d2239cSSatish Balay #endif 10303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1031613e5ff0Sstefano_zampini } 1032613e5ff0Sstefano_zampini 1033d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat P, Mat C) 1034d71ae5a4SJacob Faibussowitsch { 10356f231fbdSstefano_zampini Mat B; 10366abb4441SStefano Zampini hypre_ParCSRMatrix *hA, *hP, *hPtAP = NULL; 10374222ddf1SHong Zhang Mat_Product *product = C->product; 1038613e5ff0Sstefano_zampini 1039613e5ff0Sstefano_zampini PetscFunctionBegin; 10409566063dSJacob Faibussowitsch 
PetscCall(MatAIJGetParCSR_Private(A, &hA)); 10419566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(P, &hP)); 10429566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hP, hA, hP, &hPtAP)); 10439566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hPtAP, MATAIJ, PETSC_OWN_POINTER, &B)); 10444222ddf1SHong Zhang 10459566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 10464222ddf1SHong Zhang C->product = product; 10474222ddf1SHong Zhang 10489566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 10499566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(P, &hP)); 10503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10516f231fbdSstefano_zampini } 10526f231fbdSstefano_zampini 1053d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat P, PetscReal fill, Mat C) 1054d71ae5a4SJacob Faibussowitsch { 10556f231fbdSstefano_zampini PetscFunctionBegin; 10569566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 10574222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_AIJ_wHYPRE; 10584222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 10593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1060613e5ff0Sstefano_zampini } 1061613e5ff0Sstefano_zampini 1062d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A, Mat P, Mat C) 1063d71ae5a4SJacob Faibussowitsch { 10644cc28894Sstefano_zampini Mat B; 10654cc28894Sstefano_zampini Mat_HYPRE *hP; 10666abb4441SStefano Zampini hypre_ParCSRMatrix *hA = NULL, *Pparcsr, *ptapparcsr = NULL; 1067613e5ff0Sstefano_zampini HYPRE_Int type; 1068613e5ff0Sstefano_zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 10694cc28894Sstefano_zampini PetscBool ishypre; 1070613e5ff0Sstefano_zampini 1071613e5ff0Sstefano_zampini PetscFunctionBegin; 10729566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre)); 
107328b400f6SJacob Faibussowitsch PetscCheck(ishypre, comm, PETSC_ERR_USER, "P should be of type %s", MATHYPRE); 10744cc28894Sstefano_zampini hP = (Mat_HYPRE *)P->data; 1075a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hP->ij, &type)); 107608401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1077a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hP->ij, (void **)&Pparcsr)); 1078613e5ff0Sstefano_zampini 10799566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 10809566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, hA, Pparcsr, &ptapparcsr)); 10819566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 1082225daaf8SStefano Zampini 10834cc28894Sstefano_zampini /* create temporary matrix and merge to C */ 10849566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr, ((PetscObject)C)->type_name, PETSC_OWN_POINTER, &B)); 10859566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 10863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10874cc28894Sstefano_zampini } 10884cc28894Sstefano_zampini 1089d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A, Mat P, Mat C) 1090d71ae5a4SJacob Faibussowitsch { 10914cc28894Sstefano_zampini Mat B; 10926abb4441SStefano Zampini hypre_ParCSRMatrix *Aparcsr, *Pparcsr, *ptapparcsr = NULL; 10934cc28894Sstefano_zampini Mat_HYPRE *hA, *hP; 10944cc28894Sstefano_zampini PetscBool ishypre; 10954cc28894Sstefano_zampini HYPRE_Int type; 10964cc28894Sstefano_zampini 10974cc28894Sstefano_zampini PetscFunctionBegin; 10989566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre)); 109928b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)P), PETSC_ERR_USER, "P should be of type %s", MATHYPRE); 11009566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, 
MATHYPRE, &ishypre)); 110128b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE); 11024cc28894Sstefano_zampini hA = (Mat_HYPRE *)A->data; 11034cc28894Sstefano_zampini hP = (Mat_HYPRE *)P->data; 1104a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type)); 110508401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1106a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hP->ij, &type)); 110708401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)P), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1108a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&Aparcsr)); 1109a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hP->ij, (void **)&Pparcsr)); 11109566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, Aparcsr, Pparcsr, &ptapparcsr)); 11119566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr, MATHYPRE, PETSC_OWN_POINTER, &B)); 11129566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 11133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11144cc28894Sstefano_zampini } 11154cc28894Sstefano_zampini 1116d501dc42Sstefano_zampini /* calls hypre_ParMatmul 1117d501dc42Sstefano_zampini hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA 11183dad0653Sstefano_zampini hypre_ParMatrixCreate does not duplicate the communicator 11196ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 1120d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB) 1121d71ae5a4SJacob Faibussowitsch { 1122d501dc42Sstefano_zampini PetscFunctionBegin; 11236ea7df73SStefano Zampini /* can be replaced by version test later */ 
11246ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 1125792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatMat"); 11266ea7df73SStefano Zampini *hAB = hypre_ParCSRMatMat(hA, hB); 11276ea7df73SStefano Zampini #else 1128792fecdfSBarry Smith PetscStackPushExternal("hypre_ParMatmul"); 1129d501dc42Sstefano_zampini *hAB = hypre_ParMatmul(hA, hB); 11306ea7df73SStefano Zampini #endif 1131d501dc42Sstefano_zampini PetscStackPop; 11323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1133d501dc42Sstefano_zampini } 1134d501dc42Sstefano_zampini 1135d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C) 1136d71ae5a4SJacob Faibussowitsch { 11375e5acdf2Sstefano_zampini Mat D; 1138d501dc42Sstefano_zampini hypre_ParCSRMatrix *hA, *hB, *hAB = NULL; 11394222ddf1SHong Zhang Mat_Product *product = C->product; 11405e5acdf2Sstefano_zampini 11415e5acdf2Sstefano_zampini PetscFunctionBegin; 11429566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 11439566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B, &hB)); 11449566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(hA, hB, &hAB)); 11459566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hAB, MATAIJ, PETSC_OWN_POINTER, &D)); 11464222ddf1SHong Zhang 11479566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &D)); 11484222ddf1SHong Zhang C->product = product; 11494222ddf1SHong Zhang 11509566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 11519566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B, &hB)); 11523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11535e5acdf2Sstefano_zampini } 11545e5acdf2Sstefano_zampini 1155d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat B, PetscReal fill, Mat C) 1156d71ae5a4SJacob Faibussowitsch { 11575e5acdf2Sstefano_zampini PetscFunctionBegin; 
11589566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 11594222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE; 11604222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 11613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11625e5acdf2Sstefano_zampini } 11635e5acdf2Sstefano_zampini 1164d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A, Mat B, Mat C) 1165d71ae5a4SJacob Faibussowitsch { 1166d501dc42Sstefano_zampini Mat D; 1167d501dc42Sstefano_zampini hypre_ParCSRMatrix *Aparcsr, *Bparcsr, *ABparcsr = NULL; 1168d501dc42Sstefano_zampini Mat_HYPRE *hA, *hB; 1169d501dc42Sstefano_zampini PetscBool ishypre; 1170d501dc42Sstefano_zampini HYPRE_Int type; 11714222ddf1SHong Zhang Mat_Product *product; 1172d501dc42Sstefano_zampini 1173d501dc42Sstefano_zampini PetscFunctionBegin; 11749566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHYPRE, &ishypre)); 117528b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)B), PETSC_ERR_USER, "B should be of type %s", MATHYPRE); 11769566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre)); 117728b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE); 1178d501dc42Sstefano_zampini hA = (Mat_HYPRE *)A->data; 1179d501dc42Sstefano_zampini hB = (Mat_HYPRE *)B->data; 1180a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type)); 118108401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1182a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hB->ij, &type)); 118308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1184a333fa2bSZach Atkins 
PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&Aparcsr)); 1185a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hB->ij, (void **)&Bparcsr)); 11869566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(Aparcsr, Bparcsr, &ABparcsr)); 11879566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ABparcsr, MATHYPRE, PETSC_OWN_POINTER, &D)); 11884222ddf1SHong Zhang 1189d501dc42Sstefano_zampini /* need to use HeaderReplace because HeaderMerge messes up with the communicator */ 11904222ddf1SHong Zhang product = C->product; /* save it from MatHeaderReplace() */ 11914222ddf1SHong Zhang C->product = NULL; 11929566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(C, &D)); 11934222ddf1SHong Zhang C->product = product; 1194d501dc42Sstefano_zampini C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 11954222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 11963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1197d501dc42Sstefano_zampini } 1198d501dc42Sstefano_zampini 1199d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, Mat D) 1200d71ae5a4SJacob Faibussowitsch { 120120e1dc0dSstefano_zampini Mat E; 12026abb4441SStefano Zampini hypre_ParCSRMatrix *hA, *hB, *hC, *hABC = NULL; 120320e1dc0dSstefano_zampini 120420e1dc0dSstefano_zampini PetscFunctionBegin; 12059566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 12069566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B, &hB)); 12079566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(C, &hC)); 12089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hA, hB, hC, &hABC)); 12099566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hABC, MATAIJ, PETSC_OWN_POINTER, &E)); 12109566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(D, &E)); 12119566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 12129566063dSJacob 
Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B, &hB)); 12139566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(C, &hC)); 12143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 121520e1dc0dSstefano_zampini } 121620e1dc0dSstefano_zampini 1217d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, PetscReal fill, Mat D) 1218d71ae5a4SJacob Faibussowitsch { 121920e1dc0dSstefano_zampini PetscFunctionBegin; 12209566063dSJacob Faibussowitsch PetscCall(MatSetType(D, MATAIJ)); 12213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 122220e1dc0dSstefano_zampini } 122320e1dc0dSstefano_zampini 1224d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C) 1225d71ae5a4SJacob Faibussowitsch { 12264222ddf1SHong Zhang PetscFunctionBegin; 12274222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 12283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12294222ddf1SHong Zhang } 12304222ddf1SHong Zhang 1231d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C) 1232d71ae5a4SJacob Faibussowitsch { 12334222ddf1SHong Zhang Mat_Product *product = C->product; 12344222ddf1SHong Zhang PetscBool Ahypre; 12354222ddf1SHong Zhang 12364222ddf1SHong Zhang PetscFunctionBegin; 12379566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)product->A, MATHYPRE, &Ahypre)); 12384222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 12399566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 12404222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE; 12414222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 12423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12436718818eSStefano Zampini } 12443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12454222ddf1SHong Zhang } 12464222ddf1SHong 
Zhang 1247d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C) 1248d71ae5a4SJacob Faibussowitsch { 12494222ddf1SHong Zhang PetscFunctionBegin; 12504222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 12513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12524222ddf1SHong Zhang } 12534222ddf1SHong Zhang 1254d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C) 1255d71ae5a4SJacob Faibussowitsch { 12564222ddf1SHong Zhang Mat_Product *product = C->product; 12574222ddf1SHong Zhang PetscBool flg; 12584222ddf1SHong Zhang PetscInt type = 0; 12594222ddf1SHong Zhang const char *outTypes[4] = {"aij", "seqaij", "mpiaij", "hypre"}; 12604222ddf1SHong Zhang PetscInt ntype = 4; 12614222ddf1SHong Zhang Mat A = product->A; 12624222ddf1SHong Zhang PetscBool Ahypre; 12634222ddf1SHong Zhang 12644222ddf1SHong Zhang PetscFunctionBegin; 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &Ahypre)); 12664222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 12679566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 12684222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 12694222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_HYPRE_HYPRE; 12703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12714222ddf1SHong Zhang } 12724222ddf1SHong Zhang 12734222ddf1SHong Zhang /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */ 12744222ddf1SHong Zhang /* Get runtime option */ 12754222ddf1SHong Zhang if (product->api_user) { 1276d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatPtAP_HYPRE", "Mat"); 12779566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-matptap_hypre_outtype", "MatPtAP outtype", "MatPtAP outtype", outTypes, ntype, outTypes[type], &type, &flg)); 1278d0609cedSBarry Smith PetscOptionsEnd(); 
12794222ddf1SHong Zhang } else { 1280d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatProduct_PtAP_HYPRE", "Mat"); 12819566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-mat_product_algorithm_hypre_outtype", "MatProduct_PtAP outtype", "MatProduct_PtAP", outTypes, ntype, outTypes[type], &type, &flg)); 1282d0609cedSBarry Smith PetscOptionsEnd(); 12834222ddf1SHong Zhang } 12844222ddf1SHong Zhang 12854222ddf1SHong Zhang if (type == 0 || type == 1 || type == 2) { 12869566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 12874222ddf1SHong Zhang } else if (type == 3) { 12889566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 12894222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C), PETSC_ERR_SUP, "MatPtAP outtype is not supported"); 12904222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 12914222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_HYPRE; 12923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12934222ddf1SHong Zhang } 12944222ddf1SHong Zhang 1295d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C) 1296d71ae5a4SJacob Faibussowitsch { 12974222ddf1SHong Zhang Mat_Product *product = C->product; 12984222ddf1SHong Zhang 12994222ddf1SHong Zhang PetscFunctionBegin; 13004222ddf1SHong Zhang switch (product->type) { 1301d71ae5a4SJacob Faibussowitsch case MATPRODUCT_AB: 1302d71ae5a4SJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_AB(C)); 1303d71ae5a4SJacob Faibussowitsch break; 1304d71ae5a4SJacob Faibussowitsch case MATPRODUCT_PtAP: 1305d71ae5a4SJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_PtAP(C)); 1306d71ae5a4SJacob Faibussowitsch break; 1307d71ae5a4SJacob Faibussowitsch default: 1308d71ae5a4SJacob Faibussowitsch break; 13094222ddf1SHong Zhang } 13103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13114222ddf1SHong Zhang } 13124222ddf1SHong 
Zhang 1313d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y) 1314d71ae5a4SJacob Faibussowitsch { 131563c07aadSStefano Zampini PetscFunctionBegin; 13169566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_TRUE)); 13173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 131863c07aadSStefano Zampini } 131963c07aadSStefano Zampini 1320d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y) 1321d71ae5a4SJacob Faibussowitsch { 132263c07aadSStefano Zampini PetscFunctionBegin; 13239566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_FALSE)); 13243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 132563c07aadSStefano Zampini } 132663c07aadSStefano Zampini 1327d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1328d71ae5a4SJacob Faibussowitsch { 1329414bd5c3SStefano Zampini PetscFunctionBegin; 133048a46eb9SPierre Jolivet if (y != z) PetscCall(VecCopy(y, z)); 13319566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_FALSE)); 13323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1333414bd5c3SStefano Zampini } 1334414bd5c3SStefano Zampini 1335d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1336d71ae5a4SJacob Faibussowitsch { 1337414bd5c3SStefano Zampini PetscFunctionBegin; 133848a46eb9SPierre Jolivet if (y != z) PetscCall(VecCopy(y, z)); 13399566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_TRUE)); 13403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1341414bd5c3SStefano Zampini } 1342414bd5c3SStefano Zampini 1343414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */ 1344d71ae5a4SJacob Faibussowitsch static PetscErrorCode 
MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans) 1345d71ae5a4SJacob Faibussowitsch { 134663c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 134763c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 134863c07aadSStefano Zampini hypre_ParVector *hx, *hy; 134963c07aadSStefano Zampini 135063c07aadSStefano Zampini PetscFunctionBegin; 135163c07aadSStefano Zampini if (trans) { 13529566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->b, x)); 13539566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->x, y)); 13549566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->x, y)); 1355a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->b->ij, (void **)&hx)); 1356a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->x->ij, (void **)&hy)); 135763c07aadSStefano Zampini } else { 13589566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->x, x)); 13599566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->b, y)); 13609566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->b, y)); 1361a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->x->ij, (void **)&hx)); 1362a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->b->ij, (void **)&hy)); 136363c07aadSStefano Zampini } 1364a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr)); 13656ea7df73SStefano Zampini if (trans) { 1366a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixMatvecT(a, parcsr, hx, b, hy)); 13676ea7df73SStefano Zampini } else { 1368a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixMatvec(a, parcsr, hx, b, hy)); 13696ea7df73SStefano Zampini } 13709566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->x)); 13719566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->b)); 13723ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 137363c07aadSStefano Zampini } 137463c07aadSStefano Zampini 1375d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDestroy_HYPRE(Mat A) 1376d71ae5a4SJacob Faibussowitsch { 137763c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 137863c07aadSStefano Zampini 137963c07aadSStefano Zampini PetscFunctionBegin; 13809566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->x)); 13819566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->b)); 138206977982Sstefanozampini PetscCall(MatHYPRE_DestroyCOOMat(A)); /* must be called before destroying the individual CSR */ 1383978814f1SStefano Zampini if (hA->ij) { 1384978814f1SStefano Zampini if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL; 1385a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixDestroy(hA->ij)); 1386978814f1SStefano Zampini } 13879566063dSJacob Faibussowitsch if (hA->comm) PetscCall(PetscCommRestoreComm(PetscObjectComm((PetscObject)A), &hA->comm)); 1388c69f721fSFande Kong 13899566063dSJacob Faibussowitsch PetscCall(MatStashDestroy_Private(&A->stash)); 13909566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array)); 1391a32e9c99SJunchao Zhang if (hA->rows_d) PetscStackCallExternalVoid("hypre_Free", hypre_Free(hA->rows_d, HYPRE_MEMORY_DEVICE)); 1392c69f721fSFande Kong 13939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_aij_C", NULL)); 13949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_is_C", NULL)); 13959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_hypre_C", NULL)); 13969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaij_hypre_C", NULL)); 139706977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_hypre_C", NULL)); 
139806977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaijhipsparse_hypre_C", NULL)); 139906977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_hypre_C", NULL)); 140006977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaijcusparse_hypre_C", NULL)); 14019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPRESetPreallocation_C", NULL)); 14029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPREGetParCSR_C", NULL)); 14035fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 14045fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 14059566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 14063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 140763c07aadSStefano Zampini } 140863c07aadSStefano Zampini 1409d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetUp_HYPRE(Mat A) 1410d71ae5a4SJacob Faibussowitsch { 14114ec6421dSstefano_zampini PetscFunctionBegin; 141206977982Sstefanozampini if (!A->preallocated) PetscCall(MatHYPRESetPreallocation(A, PETSC_DEFAULT, NULL, PETSC_DEFAULT, NULL)); 14133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14144ec6421dSstefano_zampini } 14154ec6421dSstefano_zampini 14166ea7df73SStefano Zampini //TODO FIX hypre_CSRMatrixMatvecOutOfPlace 14176ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 1418d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind) 1419d71ae5a4SJacob Faibussowitsch { 14206ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 14216ea7df73SStefano Zampini HYPRE_MemoryLocation hmem = bind ? 
HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE; 14226ea7df73SStefano Zampini 14236ea7df73SStefano Zampini PetscFunctionBegin; 14246ea7df73SStefano Zampini A->boundtocpu = bind; 14255fbaff96SJunchao Zhang if (hA->ij && hypre_IJMatrixAssembleFlag(hA->ij) && hmem != hypre_IJMatrixMemoryLocation(hA->ij)) { 14266ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 1427a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr)); 1428a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixMigrate(parcsr, hmem)); 14296ea7df73SStefano Zampini } 14309566063dSJacob Faibussowitsch if (hA->x) PetscCall(VecHYPRE_IJBindToCPU(hA->x, bind)); 14319566063dSJacob Faibussowitsch if (hA->b) PetscCall(VecHYPRE_IJBindToCPU(hA->b, bind)); 14323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14336ea7df73SStefano Zampini } 14346ea7df73SStefano Zampini #endif 14356ea7df73SStefano Zampini 1436d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode) 1437d71ae5a4SJacob Faibussowitsch { 143863c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1439c69f721fSFande Kong PetscMPIInt n; 1440c69f721fSFande Kong PetscInt i, j, rstart, ncols, flg; 1441c69f721fSFande Kong PetscInt *row, *col; 1442c69f721fSFande Kong PetscScalar *val; 144363c07aadSStefano Zampini 144463c07aadSStefano Zampini PetscFunctionBegin; 144508401ef6SPierre Jolivet PetscCheck(mode != MAT_FLUSH_ASSEMBLY, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE"); 1446c69f721fSFande Kong 1447c69f721fSFande Kong if (!A->nooffprocentries) { 1448c69f721fSFande Kong while (1) { 14499566063dSJacob Faibussowitsch PetscCall(MatStashScatterGetMesg_Private(&A->stash, &n, &row, &col, &val, &flg)); 1450c69f721fSFande Kong if (!flg) break; 1451c69f721fSFande Kong 1452c69f721fSFande Kong for (i = 0; i < n;) { 1453c69f721fSFande Kong /* Now identify the consecutive vals belonging to the same row */ 
1454c69f721fSFande Kong for (j = i, rstart = row[j]; j < n; j++) { 1455c69f721fSFande Kong if (row[j] != rstart) break; 1456c69f721fSFande Kong } 1457c69f721fSFande Kong if (j < n) ncols = j - i; 1458c69f721fSFande Kong else ncols = n - i; 1459c69f721fSFande Kong /* Now assemble all these values with a single function call */ 14609566063dSJacob Faibussowitsch PetscCall(MatSetValues_HYPRE(A, 1, row + i, ncols, col + i, val + i, A->insertmode)); 1461c69f721fSFande Kong 1462c69f721fSFande Kong i = j; 1463c69f721fSFande Kong } 1464c69f721fSFande Kong } 14659566063dSJacob Faibussowitsch PetscCall(MatStashScatterEnd_Private(&A->stash)); 1466c69f721fSFande Kong } 1467c69f721fSFande Kong 1468a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixAssemble(hA->ij)); 1469336664bdSPierre Jolivet /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */ 1470336664bdSPierre Jolivet /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */ 1471651b1cf9SStefano Zampini if (!A->sortedfull) { 1472af1cf968SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1473af1cf968SStefano Zampini 1474af1cf968SStefano Zampini /* call destroy just to make sure we do not leak anything */ 1475af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1476a333fa2bSZach Atkins PetscCallHYPRE(hypre_AuxParCSRMatrixDestroy(aux_matrix)); 1477af1cf968SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1478af1cf968SStefano Zampini 1479af1cf968SStefano Zampini /* Initialize with assembled flag -> it only recreates the aux_par_matrix */ 1480a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij)); 1481af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 14826ea7df73SStefano Zampini if (aux_matrix) { 1483af1cf968SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see 
comment in MatHYPRESetPreallocation_HYPRE */ 148422235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 1485a333fa2bSZach Atkins PetscCallHYPRE(hypre_AuxParCSRMatrixInitialize(aux_matrix)); 148622235d61SPierre Jolivet #else 1487a333fa2bSZach Atkins PetscCallHYPRE(hypre_AuxParCSRMatrixInitialize_v2(aux_matrix, HYPRE_MEMORY_HOST)); 148822235d61SPierre Jolivet #endif 1489af1cf968SStefano Zampini } 14906ea7df73SStefano Zampini } 14916ea7df73SStefano Zampini { 14926ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 14936ea7df73SStefano Zampini 1494a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr)); 1495a333fa2bSZach Atkins if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscCallHYPRE(hypre_MatvecCommPkgCreate(parcsr)); 14966ea7df73SStefano Zampini } 14979566063dSJacob Faibussowitsch if (!hA->x) PetscCall(VecHYPRE_IJVectorCreate(A->cmap, &hA->x)); 14989566063dSJacob Faibussowitsch if (!hA->b) PetscCall(VecHYPRE_IJVectorCreate(A->rmap, &hA->b)); 14996ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 15009566063dSJacob Faibussowitsch PetscCall(MatBindToCPU_HYPRE(A, A->boundtocpu)); 15016ea7df73SStefano Zampini #endif 15023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 150363c07aadSStefano Zampini } 150463c07aadSStefano Zampini 1505d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array) 1506d71ae5a4SJacob Faibussowitsch { 1507c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1508c69f721fSFande Kong 1509c69f721fSFande Kong PetscFunctionBegin; 1510651b1cf9SStefano Zampini PetscCheck(hA->array_available, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Temporary space is in use"); 1511c69f721fSFande Kong 1512651b1cf9SStefano Zampini if (hA->array_size >= size) { 151339accc25SStefano Zampini *array = hA->array; 151439accc25SStefano Zampini } else { 15159566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array)); 1516651b1cf9SStefano Zampini hA->array_size = 
size; 1517651b1cf9SStefano Zampini PetscCall(PetscMalloc(hA->array_size, &hA->array)); 1518c69f721fSFande Kong *array = hA->array; 1519c69f721fSFande Kong } 1520c69f721fSFande Kong 1521651b1cf9SStefano Zampini hA->array_available = PETSC_FALSE; 15223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1523c69f721fSFande Kong } 1524c69f721fSFande Kong 1525d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array) 1526d71ae5a4SJacob Faibussowitsch { 1527c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1528c69f721fSFande Kong 1529c69f721fSFande Kong PetscFunctionBegin; 1530c69f721fSFande Kong *array = NULL; 1531651b1cf9SStefano Zampini hA->array_available = PETSC_TRUE; 15323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1533c69f721fSFande Kong } 1534c69f721fSFande Kong 1535d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins) 1536d71ae5a4SJacob Faibussowitsch { 1537d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1538d975228cSstefano_zampini PetscScalar *vals = (PetscScalar *)v; 153939accc25SStefano Zampini HYPRE_Complex *sscr; 1540c69f721fSFande Kong PetscInt *cscr[2]; 1541c69f721fSFande Kong PetscInt i, nzc; 1542651b1cf9SStefano Zampini PetscInt rst = A->rmap->rstart, ren = A->rmap->rend; 154308defe43SFande Kong void *array = NULL; 1544d975228cSstefano_zampini 1545d975228cSstefano_zampini PetscFunctionBegin; 15469566063dSJacob Faibussowitsch PetscCall(MatGetArray_HYPRE(A, sizeof(PetscInt) * (2 * nc) + sizeof(HYPRE_Complex) * nc * nr, &array)); 1547c69f721fSFande Kong cscr[0] = (PetscInt *)array; 1548c69f721fSFande Kong cscr[1] = ((PetscInt *)array) + nc; 154939accc25SStefano Zampini sscr = (HYPRE_Complex *)(((PetscInt *)array) + nc * 2); 1550d975228cSstefano_zampini for (i = 0, nzc = 0; i < nc; i++) { 1551d975228cSstefano_zampini if (cols[i] >= 
0) { 1552d975228cSstefano_zampini cscr[0][nzc] = cols[i]; 1553d975228cSstefano_zampini cscr[1][nzc++] = i; 1554d975228cSstefano_zampini } 1555d975228cSstefano_zampini } 1556c69f721fSFande Kong if (!nzc) { 15579566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A, &array)); 15583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1559c69f721fSFande Kong } 1560d975228cSstefano_zampini 15616ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE) 15626ea7df73SStefano Zampini if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) { 15636ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 15646ea7df73SStefano Zampini 1565a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij,(void**)&parcsr)); 1566a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixMigrate(parcsr, HYPRE_MEMORY_HOST)); 15676ea7df73SStefano Zampini } 15686ea7df73SStefano Zampini #endif 15696ea7df73SStefano Zampini 1570d975228cSstefano_zampini if (ins == ADD_VALUES) { 1571d975228cSstefano_zampini for (i = 0; i < nr; i++) { 15726ea7df73SStefano Zampini if (rows[i] >= 0) { 1573d975228cSstefano_zampini PetscInt j; 15742cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 15752cf14000SStefano Zampini 1576651b1cf9SStefano Zampini if (!nzc) continue; 1577651b1cf9SStefano Zampini /* nonlocal values */ 1578651b1cf9SStefano Zampini if (rows[i] < rst || rows[i] >= ren) { 1579651b1cf9SStefano Zampini PetscCheck(!A->nooffprocentries, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Setting off process row %" PetscInt_FMT " even though MatSetOption(,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE) was set", rows[i]); 1580651b1cf9SStefano Zampini if (hA->donotstash) continue; 1581651b1cf9SStefano Zampini } 1582aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! 
number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]); 15839566063dSJacob Faibussowitsch for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j])); 1584a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixAddToValues(hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr)); 1585d975228cSstefano_zampini } 1586d975228cSstefano_zampini vals += nc; 1587d975228cSstefano_zampini } 1588d975228cSstefano_zampini } else { /* INSERT_VALUES */ 1589d975228cSstefano_zampini for (i = 0; i < nr; i++) { 15906ea7df73SStefano Zampini if (rows[i] >= 0) { 1591d975228cSstefano_zampini PetscInt j; 15922cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 15932cf14000SStefano Zampini 1594651b1cf9SStefano Zampini if (!nzc) continue; 1595aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]); 15969566063dSJacob Faibussowitsch for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j])); 1597c69f721fSFande Kong /* nonlocal values */ 1598651b1cf9SStefano Zampini if (rows[i] < rst || rows[i] >= ren) { 1599651b1cf9SStefano Zampini PetscCheck(!A->nooffprocentries, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Setting off process row %" PetscInt_FMT " even though MatSetOption(,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE) was set", rows[i]); 1600651b1cf9SStefano Zampini if (!hA->donotstash) PetscCall(MatStashValuesRow_Private(&A->stash, rows[i], nzc, cscr[0], (PetscScalar *)sscr, PETSC_FALSE)); 1601651b1cf9SStefano Zampini } 1602c69f721fSFande Kong /* local values */ 1603651b1cf9SStefano Zampini else 1604a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetValues(hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr)); 1605d975228cSstefano_zampini } 1606d975228cSstefano_zampini vals += nc; 1607d975228cSstefano_zampini } 1608d975228cSstefano_zampini } 1609c69f721fSFande Kong 
16109566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A, &array)); 16113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1612d975228cSstefano_zampini } 1613d975228cSstefano_zampini 1614d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1615d71ae5a4SJacob Faibussowitsch { 1616d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 16177d968826Sstefano_zampini HYPRE_Int *hdnnz, *honnz; 161806a29025Sstefano_zampini PetscInt i, rs, re, cs, ce, bs; 1619d975228cSstefano_zampini PetscMPIInt size; 1620d975228cSstefano_zampini 1621d975228cSstefano_zampini PetscFunctionBegin; 16229566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 16239566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 1624d975228cSstefano_zampini rs = A->rmap->rstart; 1625d975228cSstefano_zampini re = A->rmap->rend; 1626d975228cSstefano_zampini cs = A->cmap->rstart; 1627d975228cSstefano_zampini ce = A->cmap->rend; 1628d975228cSstefano_zampini if (!hA->ij) { 1629a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rs, re - 1, cs, ce - 1, &hA->ij)); 1630a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR)); 1631d975228cSstefano_zampini } else { 16322cf14000SStefano Zampini HYPRE_BigInt hrs, hre, hcs, hce; 1633a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetLocalRange(hA->ij, &hrs, &hre, &hcs, &hce)); 1634aed4548fSBarry Smith PetscCheck(hre - hrs + 1 == re - rs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local rows: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hrs, hre + 1, rs, re); 1635aed4548fSBarry Smith PetscCheck(hce - hcs + 1 == ce - cs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local cols: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", 
hcs, hce + 1, cs, ce); 1636d975228cSstefano_zampini } 163706977982Sstefanozampini PetscCall(MatHYPRE_DestroyCOOMat(A)); 16389566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 163906a29025Sstefano_zampini if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10 * bs; 164006a29025Sstefano_zampini if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10 * bs; 164106a29025Sstefano_zampini 1642d975228cSstefano_zampini if (!dnnz) { 16439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &hdnnz)); 1644*f2f41e48SZach Atkins for (i = 0; i < A->rmap->n; i++) hdnnz[i] = (HYPRE_Int)dnz; 1645d975228cSstefano_zampini } else { 16467d968826Sstefano_zampini hdnnz = (HYPRE_Int *)dnnz; 1647d975228cSstefano_zampini } 16489566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size)); 1649d975228cSstefano_zampini if (size > 1) { 1650ddbeb582SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1651d975228cSstefano_zampini if (!onnz) { 16529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &honnz)); 1653*f2f41e48SZach Atkins for (i = 0; i < A->rmap->n; i++) honnz[i] = (HYPRE_Int)onz; 165422235d61SPierre Jolivet } else honnz = (HYPRE_Int *)onnz; 1655ddbeb582SStefano Zampini /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems 1656ddbeb582SStefano Zampini they assume the user will input the entire row values, properly sorted 1657336664bdSPierre Jolivet In PETSc, we don't make such an assumption and set this flag to 1, 1658336664bdSPierre Jolivet unless the option MAT_SORTED_FULL is set to true. 
1659ddbeb582SStefano Zampini Also, to avoid possible memory leaks, we destroy and recreate the translator 1660ddbeb582SStefano Zampini This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize 1661ddbeb582SStefano Zampini the IJ matrix for us */ 1662ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1663ddbeb582SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 1664ddbeb582SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1665a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(hA->ij, hdnnz, honnz)); 1666ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1667651b1cf9SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !A->sortedfull; 1668d975228cSstefano_zampini } else { 1669d975228cSstefano_zampini honnz = NULL; 1670a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetRowSizes(hA->ij, hdnnz)); 1671d975228cSstefano_zampini } 1672ddbeb582SStefano Zampini 1673af1cf968SStefano Zampini /* reset assembled flag and call the initialize method */ 1674af1cf968SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 0; 16756ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 1676a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij)); 16776ea7df73SStefano Zampini #else 1678a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize_v2(hA->ij, HYPRE_MEMORY_HOST)); 16796ea7df73SStefano Zampini #endif 168048a46eb9SPierre Jolivet if (!dnnz) PetscCall(PetscFree(hdnnz)); 168148a46eb9SPierre Jolivet if (!onnz && honnz) PetscCall(PetscFree(honnz)); 1682af1cf968SStefano Zampini /* Match AIJ logic */ 168306a29025Sstefano_zampini A->preallocated = PETSC_TRUE; 1684af1cf968SStefano Zampini A->assembled = PETSC_FALSE; 16853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1686d975228cSstefano_zampini } 1687d975228cSstefano_zampini 1688d975228cSstefano_zampini /*@C 1689d975228cSstefano_zampini 
MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format

  Collective

  Input Parameters:
+ A    - the matrix
. dnz  - number of nonzeros per row in DIAGONAL portion of local submatrix
         (same value is used for all local rows)
. dnnz - array containing the number of nonzeros in the various rows of the
         DIAGONAL portion of the local submatrix (possibly different for each row)
         or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `dnz` is used to specify the nonzero structure.
         The size of this array is equal to the number of local rows, i.e. `m`.
         For matrices that will be factored, you must leave room for (and set)
         the diagonal entry even if it is zero.
. onz  - number of nonzeros per row in the OFF-DIAGONAL portion of local
         submatrix (same value is used for all local rows).
- onnz - array containing the number of nonzeros in the various rows of the
         OFF-DIAGONAL portion of the local submatrix (possibly different for
         each row) or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `onz` is used to specify the nonzero
         structure. The size of this array is equal to the number
         of local rows, i.e. `m`.

  Level: intermediate

  Note:
  If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, `onz` and `onnz` are ignored.
1715d975228cSstefano_zampini 17161cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatMPIAIJSetPreallocation()`, `MATHYPRE`, `MATAIJ` 1717d975228cSstefano_zampini @*/ 1718d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1719d71ae5a4SJacob Faibussowitsch { 1720d975228cSstefano_zampini PetscFunctionBegin; 1721d975228cSstefano_zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1722d975228cSstefano_zampini PetscValidType(A, 1); 1723cac4c232SBarry Smith PetscTryMethod(A, "MatHYPRESetPreallocation_C", (Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[]), (A, dnz, dnnz, onz, onnz)); 17243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1725d975228cSstefano_zampini } 1726d975228cSstefano_zampini 172720f4b53cSBarry Smith /*@C 17282ef1f0ffSBarry Smith MatCreateFromParCSR - Creates a `Mat` from a `hypre_ParCSRMatrix` 1729225daaf8SStefano Zampini 1730225daaf8SStefano Zampini Collective 1731225daaf8SStefano Zampini 1732225daaf8SStefano Zampini Input Parameters: 17332ef1f0ffSBarry Smith + parcsr - the pointer to the `hypre_ParCSRMatrix` 17342ef1f0ffSBarry Smith . mtype - matrix type to be created. Currently `MATAIJ`, `MATIS` and `MATHYPRE` are supported. 173520f4b53cSBarry Smith - copymode - PETSc copying options, see `PetscCopyMode` 1736225daaf8SStefano Zampini 1737225daaf8SStefano Zampini Output Parameter: 1738225daaf8SStefano Zampini . 
A - the matrix 1739225daaf8SStefano Zampini 1740225daaf8SStefano Zampini Level: intermediate 1741225daaf8SStefano Zampini 1742bfe80ac4SPierre Jolivet .seealso: [](ch_matrices), `Mat`, `MATHYPRE`, `PetscCopyMode` 174320f4b53cSBarry Smith @*/ 1744d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat *A) 1745d71ae5a4SJacob Faibussowitsch { 1746225daaf8SStefano Zampini Mat T; 1747978814f1SStefano Zampini Mat_HYPRE *hA; 1748978814f1SStefano Zampini MPI_Comm comm; 1749978814f1SStefano Zampini PetscInt rstart, rend, cstart, cend, M, N; 1750d248a85cSRichard Tran Mills PetscBool isseqaij, isseqaijmkl, ismpiaij, isaij, ishyp, isis; 1751978814f1SStefano Zampini 1752978814f1SStefano Zampini PetscFunctionBegin; 1753978814f1SStefano Zampini comm = hypre_ParCSRMatrixComm(parcsr); 17549566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATSEQAIJ, &isseqaij)); 17559566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATSEQAIJMKL, &isseqaijmkl)); 17569566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATMPIAIJ, &ismpiaij)); 17579566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij)); 17589566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATHYPRE, &ishyp)); 17599566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATIS, &isis)); 1760d248a85cSRichard Tran Mills isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij); 17616ea7df73SStefano Zampini /* TODO */ 1762aed4548fSBarry Smith PetscCheck(isaij || ishyp || isis, comm, PETSC_ERR_SUP, "Unsupported MatType %s! 
Supported types are %s, %s, %s, %s, %s, and %s", mtype, MATAIJ, MATSEQAIJ, MATSEQAIJMKL, MATMPIAIJ, MATIS, MATHYPRE); 1763978814f1SStefano Zampini /* access ParCSRMatrix */ 1764978814f1SStefano Zampini rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr); 1765978814f1SStefano Zampini rend = hypre_ParCSRMatrixLastRowIndex(parcsr); 1766978814f1SStefano Zampini cstart = hypre_ParCSRMatrixFirstColDiag(parcsr); 1767978814f1SStefano Zampini cend = hypre_ParCSRMatrixLastColDiag(parcsr); 1768978814f1SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(parcsr); 1769978814f1SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(parcsr); 1770978814f1SStefano Zampini 1771978814f1SStefano Zampini /* create PETSc matrix with MatHYPRE */ 17729566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &T)); 1773c2886e86SStefano Zampini PetscCall(MatSetSizes(T, PetscMax(rend - rstart + 1, 0), PetscMax(cend - cstart + 1, 0), M, N)); 17749566063dSJacob Faibussowitsch PetscCall(MatSetType(T, MATHYPRE)); 1775f4f49eeaSPierre Jolivet hA = (Mat_HYPRE *)T->data; 1776978814f1SStefano Zampini 1777978814f1SStefano Zampini /* create HYPRE_IJMatrix */ 1778a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rstart, rend, cstart, cend, &hA->ij)); 1779a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR)); 178045b8d346SStefano Zampini 178145b8d346SStefano Zampini /* create new ParCSR object if needed */ 178245b8d346SStefano Zampini if (ishyp && copymode == PETSC_COPY_VALUES) { 178345b8d346SStefano Zampini hypre_ParCSRMatrix *new_parcsr; 17846ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 178545b8d346SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd, *ndiag, *noffd; 178645b8d346SStefano Zampini 17870e6427aaSSatish Balay new_parcsr = hypre_ParCSRMatrixClone(parcsr, 0); 178845b8d346SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 178945b8d346SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 179045b8d346SStefano Zampini ndiag = 
hypre_ParCSRMatrixDiag(new_parcsr); 179145b8d346SStefano Zampini noffd = hypre_ParCSRMatrixOffd(new_parcsr); 17929566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(ndiag), hypre_CSRMatrixData(hdiag), hypre_CSRMatrixNumNonzeros(hdiag))); 17939566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(noffd), hypre_CSRMatrixData(hoffd), hypre_CSRMatrixNumNonzeros(hoffd))); 17946ea7df73SStefano Zampini #else 17956ea7df73SStefano Zampini new_parcsr = hypre_ParCSRMatrixClone(parcsr, 1); 17966ea7df73SStefano Zampini #endif 179745b8d346SStefano Zampini parcsr = new_parcsr; 179845b8d346SStefano Zampini copymode = PETSC_OWN_POINTER; 179945b8d346SStefano Zampini } 1800978814f1SStefano Zampini 1801978814f1SStefano Zampini /* set ParCSR object */ 1802978814f1SStefano Zampini hypre_IJMatrixObject(hA->ij) = parcsr; 18034ec6421dSstefano_zampini T->preallocated = PETSC_TRUE; 1804978814f1SStefano Zampini 1805978814f1SStefano Zampini /* set assembled flag */ 1806978814f1SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 1; 18076ea7df73SStefano Zampini #if 0 1808a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij)); 18096ea7df73SStefano Zampini #endif 1810225daaf8SStefano Zampini if (ishyp) { 18116d2a658fSstefano_zampini PetscMPIInt myid = 0; 18126d2a658fSstefano_zampini 18136d2a658fSstefano_zampini /* make sure we always have row_starts and col_starts available */ 181448a46eb9SPierre Jolivet if (HYPRE_AssumedPartitionCheck()) PetscCallMPI(MPI_Comm_rank(comm, &myid)); 1815a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 18166d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) { 18176d2a658fSstefano_zampini PetscLayout map; 18186d2a658fSstefano_zampini 18199566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T, NULL, &map)); 18209566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 18212cf14000SStefano Zampini hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid); 
18226d2a658fSstefano_zampini } 18236d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) { 18246d2a658fSstefano_zampini PetscLayout map; 18256d2a658fSstefano_zampini 18269566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T, &map, NULL)); 18279566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 18282cf14000SStefano Zampini hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid); 18296d2a658fSstefano_zampini } 1830a1d2239cSSatish Balay #endif 1831978814f1SStefano Zampini /* prevent from freeing the pointer */ 1832978814f1SStefano Zampini if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE; 1833225daaf8SStefano Zampini *A = T; 18349566063dSJacob Faibussowitsch PetscCall(MatSetOption(*A, MAT_SORTED_FULL, PETSC_TRUE)); 18359566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*A, MAT_FINAL_ASSEMBLY)); 18369566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*A, MAT_FINAL_ASSEMBLY)); 1837bb4689ddSStefano Zampini } else if (isaij) { 1838bb4689ddSStefano Zampini if (copymode != PETSC_OWN_POINTER) { 1839225daaf8SStefano Zampini /* prevent from freeing the pointer */ 1840225daaf8SStefano Zampini hA->inner_free = PETSC_FALSE; 18419566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INITIAL_MATRIX, A)); 18429566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T)); 1843225daaf8SStefano Zampini } else { /* AIJ return type with PETSC_OWN_POINTER */ 18449566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INPLACE_MATRIX, &T)); 1845225daaf8SStefano Zampini *A = T; 1846225daaf8SStefano Zampini } 1847bb4689ddSStefano Zampini } else if (isis) { 18489566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_IS(T, MATIS, MAT_INITIAL_MATRIX, A)); 18498cfe8d00SStefano Zampini if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE; 18509566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T)); 1851bb4689ddSStefano Zampini } 18523ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 1853978814f1SStefano Zampini } 1854978814f1SStefano Zampini 1855d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr) 1856d71ae5a4SJacob Faibussowitsch { 1857dd9c0a25Sstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1858dd9c0a25Sstefano_zampini HYPRE_Int type; 1859dd9c0a25Sstefano_zampini 1860dd9c0a25Sstefano_zampini PetscFunctionBegin; 186128b400f6SJacob Faibussowitsch PetscCheck(hA->ij, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE_IJMatrix not present"); 1862a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type)); 186308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "HYPRE_IJMatrix is not of type HYPRE_PARCSR"); 1864a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)parcsr)); 18653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1866dd9c0a25Sstefano_zampini } 1867dd9c0a25Sstefano_zampini 186820f4b53cSBarry Smith /*@C 1869dd9c0a25Sstefano_zampini MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix 1870dd9c0a25Sstefano_zampini 1871cc4c1da9SBarry Smith Not Collective, No Fortran Support 1872dd9c0a25Sstefano_zampini 187320f4b53cSBarry Smith Input Parameter: 187420f4b53cSBarry Smith . A - the `MATHYPRE` object 1875dd9c0a25Sstefano_zampini 1876dd9c0a25Sstefano_zampini Output Parameter: 18772ef1f0ffSBarry Smith . 
parcsr - the pointer to the `hypre_ParCSRMatrix` 1878dd9c0a25Sstefano_zampini 1879dd9c0a25Sstefano_zampini Level: intermediate 1880dd9c0a25Sstefano_zampini 1881bfe80ac4SPierre Jolivet .seealso: [](ch_matrices), `Mat`, `MATHYPRE`, `PetscCopyMode` 188220f4b53cSBarry Smith @*/ 1883d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr) 1884d71ae5a4SJacob Faibussowitsch { 1885dd9c0a25Sstefano_zampini PetscFunctionBegin; 1886dd9c0a25Sstefano_zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1887dd9c0a25Sstefano_zampini PetscValidType(A, 1); 1888cac4c232SBarry Smith PetscUseMethod(A, "MatHYPREGetParCSR_C", (Mat, hypre_ParCSRMatrix **), (A, parcsr)); 18893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1890dd9c0a25Sstefano_zampini } 1891dd9c0a25Sstefano_zampini 1892d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_HYPRE(Mat A, PetscBool *missing, PetscInt *dd) 1893d71ae5a4SJacob Faibussowitsch { 189468ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 189568ec7858SStefano Zampini hypre_CSRMatrix *ha; 189668ec7858SStefano Zampini PetscInt rst; 189768ec7858SStefano Zampini 189868ec7858SStefano Zampini PetscFunctionBegin; 189908401ef6SPierre Jolivet PetscCheck(A->rmap->n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_SUP, "Not implemented with non-square diagonal blocks"); 19009566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, NULL)); 19019566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 190268ec7858SStefano Zampini if (missing) *missing = PETSC_FALSE; 190368ec7858SStefano Zampini if (dd) *dd = -1; 190468ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 190568ec7858SStefano Zampini if (ha) { 190668299464SStefano Zampini PetscInt size, i; 190768299464SStefano Zampini HYPRE_Int *ii, *jj; 190868ec7858SStefano Zampini 190968ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 191068ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 
191168ec7858SStefano Zampini jj = hypre_CSRMatrixJ(ha); 191268ec7858SStefano Zampini for (i = 0; i < size; i++) { 191368ec7858SStefano Zampini PetscInt j; 191468ec7858SStefano Zampini PetscBool found = PETSC_FALSE; 191568ec7858SStefano Zampini 19169371c9d4SSatish Balay for (j = ii[i]; j < ii[i + 1] && !found; j++) found = (jj[j] == i) ? PETSC_TRUE : PETSC_FALSE; 191768ec7858SStefano Zampini 191868ec7858SStefano Zampini if (!found) { 19193ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing local diagonal entry %" PetscInt_FMT "\n", i)); 192068ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 192168ec7858SStefano Zampini if (dd) *dd = i + rst; 19223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192368ec7858SStefano Zampini } 192468ec7858SStefano Zampini } 192568ec7858SStefano Zampini if (!size) { 19263ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n")); 192768ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 192868ec7858SStefano Zampini if (dd) *dd = rst; 192968ec7858SStefano Zampini } 193068ec7858SStefano Zampini } else { 19313ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n")); 193268ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 193368ec7858SStefano Zampini if (dd) *dd = rst; 193468ec7858SStefano Zampini } 19353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 193668ec7858SStefano Zampini } 193768ec7858SStefano Zampini 1938d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s) 1939d71ae5a4SJacob Faibussowitsch { 194068ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 19416ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 194268ec7858SStefano Zampini hypre_CSRMatrix *ha; 19436ea7df73SStefano Zampini #endif 194439accc25SStefano Zampini HYPRE_Complex hs; 194568ec7858SStefano Zampini 194668ec7858SStefano 
Zampini PetscFunctionBegin; 19479566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(s, &hs)); 19489566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 19496ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 19, 0) 1950a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixScale(parcsr, hs)); 19516ea7df73SStefano Zampini #else /* diagonal part */ 195268ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 195368ec7858SStefano Zampini if (ha) { 195468299464SStefano Zampini PetscInt size, i; 195568299464SStefano Zampini HYPRE_Int *ii; 195639accc25SStefano Zampini HYPRE_Complex *a; 195768ec7858SStefano Zampini 195868ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 195968ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 196068ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 196139accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 196268ec7858SStefano Zampini } 19634cf0e950SBarry Smith /* off-diagonal part */ 196468ec7858SStefano Zampini ha = hypre_ParCSRMatrixOffd(parcsr); 196568ec7858SStefano Zampini if (ha) { 196668299464SStefano Zampini PetscInt size, i; 196768299464SStefano Zampini HYPRE_Int *ii; 196839accc25SStefano Zampini HYPRE_Complex *a; 196968ec7858SStefano Zampini 197068ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 197168ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 197268ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 197339accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 197468ec7858SStefano Zampini } 19756ea7df73SStefano Zampini #endif 19763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197768ec7858SStefano Zampini } 197868ec7858SStefano Zampini 1979d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 1980d71ae5a4SJacob Faibussowitsch { 198168ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 198268299464SStefano Zampini 
HYPRE_Int *lrows; 198368299464SStefano Zampini PetscInt rst, ren, i; 198468ec7858SStefano Zampini 198568ec7858SStefano Zampini PetscFunctionBegin; 198608401ef6SPierre Jolivet PetscCheck(!x && !b, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "To be implemented"); 19879566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 19889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numRows, &lrows)); 19899566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, &ren)); 199068ec7858SStefano Zampini for (i = 0; i < numRows; i++) { 19917a46b595SBarry Smith PetscCheck(rows[i] >= rst && rows[i] < ren, PETSC_COMM_SELF, PETSC_ERR_SUP, "Non-local rows not yet supported"); 1992*f2f41e48SZach Atkins lrows[i] = (HYPRE_Int)(rows[i] - rst); 199368ec7858SStefano Zampini } 1994*f2f41e48SZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixEliminateRowsCols(parcsr, (HYPRE_Int)numRows, lrows)); 19959566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows)); 19963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 199768ec7858SStefano Zampini } 199868ec7858SStefano Zampini 1999d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha) 2000d71ae5a4SJacob Faibussowitsch { 2001c69f721fSFande Kong PetscFunctionBegin; 2002c69f721fSFande Kong if (ha) { 2003c69f721fSFande Kong HYPRE_Int *ii, size; 2004c69f721fSFande Kong HYPRE_Complex *a; 2005c69f721fSFande Kong 2006c69f721fSFande Kong size = hypre_CSRMatrixNumRows(ha); 2007c69f721fSFande Kong a = hypre_CSRMatrixData(ha); 2008c69f721fSFande Kong ii = hypre_CSRMatrixI(ha); 2009c69f721fSFande Kong 20109566063dSJacob Faibussowitsch if (a) PetscCall(PetscArrayzero(a, ii[size])); 2011c69f721fSFande Kong } 20123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2013c69f721fSFande Kong } 2014c69f721fSFande Kong 201566976f2fSJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE(Mat A) 2016d71ae5a4SJacob Faibussowitsch { 20176ea7df73SStefano 
Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 20186ea7df73SStefano Zampini 20196ea7df73SStefano Zampini PetscFunctionBegin; 20206ea7df73SStefano Zampini if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) { 2021a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetConstantValues(hA->ij, 0.0)); 20226ea7df73SStefano Zampini } else { 2023c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 2024c69f721fSFande Kong 20259566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 20269566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr))); 20279566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr))); 20286ea7df73SStefano Zampini } 20293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2030c69f721fSFande Kong } 2031c69f721fSFande Kong 2032d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA, PetscInt N, const PetscInt rows[], HYPRE_Complex diag) 2033d71ae5a4SJacob Faibussowitsch { 203439accc25SStefano Zampini PetscInt ii; 203539accc25SStefano Zampini HYPRE_Int *i, *j; 203639accc25SStefano Zampini HYPRE_Complex *a; 2037c69f721fSFande Kong 2038c69f721fSFande Kong PetscFunctionBegin; 20393ba16761SJacob Faibussowitsch if (!hA) PetscFunctionReturn(PETSC_SUCCESS); 2040c69f721fSFande Kong 204139accc25SStefano Zampini i = hypre_CSRMatrixI(hA); 204239accc25SStefano Zampini j = hypre_CSRMatrixJ(hA); 2043c69f721fSFande Kong a = hypre_CSRMatrixData(hA); 2044a32e9c99SJunchao Zhang #if defined(PETSC_HAVE_HYPRE_DEVICE) 2045a32e9c99SJunchao Zhang if (HYPRE_MEMORY_DEVICE == hypre_CSRMatrixMemoryLocation(hA)) { 2046a32e9c99SJunchao Zhang #if defined(HYPRE_USING_CUDA) 2047a32e9c99SJunchao Zhang MatZeroRows_CUDA(N, rows, i, j, a, diag); 2048a32e9c99SJunchao Zhang #elif defined(HYPRE_USING_HIP) 2049a32e9c99SJunchao Zhang MatZeroRows_HIP(N, rows, i, j, a, diag); 2050a32e9c99SJunchao Zhang #elif 
defined(PETSC_HAVE_KOKKOS) 2051a32e9c99SJunchao Zhang MatZeroRows_Kokkos(N, rows, i, j, a, diag); 2052a32e9c99SJunchao Zhang #else 2053a32e9c99SJunchao Zhang SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for MatZeroRows on a hypre matrix in this memory location"); 2054a32e9c99SJunchao Zhang #endif 2055a32e9c99SJunchao Zhang } else 2056a32e9c99SJunchao Zhang #endif 2057a32e9c99SJunchao Zhang { 2058c69f721fSFande Kong for (ii = 0; ii < N; ii++) { 205939accc25SStefano Zampini HYPRE_Int jj, ibeg, iend, irow; 206039accc25SStefano Zampini 2061*f2f41e48SZach Atkins irow = (HYPRE_Int)rows[ii]; 2062c69f721fSFande Kong ibeg = i[irow]; 2063c69f721fSFande Kong iend = i[irow + 1]; 2064c69f721fSFande Kong for (jj = ibeg; jj < iend; jj++) 2065c69f721fSFande Kong if (j[jj] == irow) a[jj] = diag; 2066c69f721fSFande Kong else a[jj] = 0.0; 2067c69f721fSFande Kong } 2068a32e9c99SJunchao Zhang } 20693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2070c69f721fSFande Kong } 2071c69f721fSFande Kong 2072d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2073d71ae5a4SJacob Faibussowitsch { 2074c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 2075a32e9c99SJunchao Zhang PetscInt *lrows, len, *lrows2; 207639accc25SStefano Zampini HYPRE_Complex hdiag; 2077c69f721fSFande Kong 2078c69f721fSFande Kong PetscFunctionBegin; 207908401ef6SPierre Jolivet PetscCheck(!x && !b, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size"); 20809566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(diag, &hdiag)); 2081c69f721fSFande Kong /* retrieve the internal matrix */ 20829566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 2083c69f721fSFande Kong /* get locally owned rows */ 20849566063dSJacob Faibussowitsch PetscCall(MatZeroRowsMapLocal_Private(A, N, rows, &len, &lrows)); 2085a32e9c99SJunchao Zhang 
2086a32e9c99SJunchao Zhang #if defined(PETSC_HAVE_HYPRE_DEVICE) 2087a32e9c99SJunchao Zhang if (HYPRE_MEMORY_DEVICE == hypre_CSRMatrixMemoryLocation(hypre_ParCSRMatrixDiag(parcsr))) { 2088a32e9c99SJunchao Zhang Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 2089a32e9c99SJunchao Zhang PetscInt m; 2090a32e9c99SJunchao Zhang PetscCall(MatGetLocalSize(A, &m, NULL)); 2091a32e9c99SJunchao Zhang if (!hA->rows_d) { 2092a32e9c99SJunchao Zhang hA->rows_d = hypre_TAlloc(PetscInt, m, HYPRE_MEMORY_DEVICE); 2093a32e9c99SJunchao Zhang if (m) PetscCheck(hA->rows_d, PETSC_COMM_SELF, PETSC_ERR_MEM, "HYPRE_TAlloc failed"); 2094a32e9c99SJunchao Zhang } 2095a32e9c99SJunchao Zhang PetscCheck(len <= m, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Too many rows in rows[]"); 2096a32e9c99SJunchao Zhang PetscStackCallExternalVoid("hypre_Memcpy", hypre_Memcpy(hA->rows_d, lrows, sizeof(PetscInt) * len, HYPRE_MEMORY_DEVICE, HYPRE_MEMORY_HOST)); 2097a32e9c99SJunchao Zhang lrows2 = hA->rows_d; 2098a32e9c99SJunchao Zhang } else 2099a32e9c99SJunchao Zhang #endif 2100a32e9c99SJunchao Zhang { 2101a32e9c99SJunchao Zhang lrows2 = lrows; 2102a32e9c99SJunchao Zhang } 2103a32e9c99SJunchao Zhang 2104c69f721fSFande Kong /* zero diagonal part */ 2105a32e9c99SJunchao Zhang PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr), len, lrows2, hdiag)); 2106c69f721fSFande Kong /* zero off-diagonal part */ 2107a32e9c99SJunchao Zhang PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr), len, lrows2, 0.0)); 2108c69f721fSFande Kong 21099566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows)); 21103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2111c69f721fSFande Kong } 2112c69f721fSFande Kong 2113d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat, MatAssemblyType mode) 2114d71ae5a4SJacob Faibussowitsch { 2115c69f721fSFande Kong PetscFunctionBegin; 21163ba16761SJacob Faibussowitsch if (mat->nooffprocentries) PetscFunctionReturn(PETSC_SUCCESS); 
2117c69f721fSFande Kong 21189566063dSJacob Faibussowitsch PetscCall(MatStashScatterBegin_Private(mat, &mat->stash, mat->rmap->range)); 21193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2120c69f721fSFande Kong } 2121c69f721fSFande Kong 2122d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2123d71ae5a4SJacob Faibussowitsch { 2124c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 21252cf14000SStefano Zampini HYPRE_Int hnz; 2126c69f721fSFande Kong 2127c69f721fSFande Kong PetscFunctionBegin; 2128c69f721fSFande Kong /* retrieve the internal matrix */ 21299566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 2130c69f721fSFande Kong /* call HYPRE API */ 2131a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_ParCSRMatrixGetRow(parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v)); 21322cf14000SStefano Zampini if (nz) *nz = (PetscInt)hnz; 21333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2134c69f721fSFande Kong } 2135c69f721fSFande Kong 2136d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2137d71ae5a4SJacob Faibussowitsch { 2138c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 21392cf14000SStefano Zampini HYPRE_Int hnz; 2140c69f721fSFande Kong 2141c69f721fSFande Kong PetscFunctionBegin; 2142c69f721fSFande Kong /* retrieve the internal matrix */ 21439566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 2144c69f721fSFande Kong /* call HYPRE API */ 21452cf14000SStefano Zampini hnz = nz ? 
(HYPRE_Int)(*nz) : 0; 2146a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_ParCSRMatrixRestoreRow(parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v)); 21473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2148c69f721fSFande Kong } 2149c69f721fSFande Kong 2150d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetValues_HYPRE(Mat A, PetscInt m, const PetscInt idxm[], PetscInt n, const PetscInt idxn[], PetscScalar v[]) 2151d71ae5a4SJacob Faibussowitsch { 215245b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 2153c69f721fSFande Kong PetscInt i; 21541d4906efSStefano Zampini 2155c69f721fSFande Kong PetscFunctionBegin; 21563ba16761SJacob Faibussowitsch if (!m || !n) PetscFunctionReturn(PETSC_SUCCESS); 2157c69f721fSFande Kong /* Ignore negative row indices 2158c69f721fSFande Kong * And negative column indices should be automatically ignored in hypre 2159c69f721fSFande Kong * */ 21602cf14000SStefano Zampini for (i = 0; i < m; i++) { 21612cf14000SStefano Zampini if (idxm[i] >= 0) { 21622cf14000SStefano Zampini HYPRE_Int hn = (HYPRE_Int)n; 2163a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetValues(hA->ij, 1, &hn, (HYPRE_BigInt *)&idxm[i], (HYPRE_BigInt *)idxn, (HYPRE_Complex *)(v + i * n))); 21642cf14000SStefano Zampini } 21652cf14000SStefano Zampini } 21663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2167c69f721fSFande Kong } 2168c69f721fSFande Kong 2169d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetOption_HYPRE(Mat A, MatOption op, PetscBool flg) 2170d71ae5a4SJacob Faibussowitsch { 2171ddbeb582SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 2172ddbeb582SStefano Zampini 2173ddbeb582SStefano Zampini PetscFunctionBegin; 2174c6698e78SStefano Zampini switch (op) { 2175ddbeb582SStefano Zampini case MAT_NO_OFF_PROC_ENTRIES: 2176a333fa2bSZach Atkins if (flg) PetscCallHYPRE(HYPRE_IJMatrixSetMaxOffProcElmts(hA->ij, 0)); 2177ddbeb582SStefano Zampini break; 2178651b1cf9SStefano Zampini case 
MAT_IGNORE_OFF_PROC_ENTRIES: 2179651b1cf9SStefano Zampini hA->donotstash = flg; 2180d71ae5a4SJacob Faibussowitsch break; 2181d71ae5a4SJacob Faibussowitsch default: 2182d71ae5a4SJacob Faibussowitsch break; 2183ddbeb582SStefano Zampini } 21843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2185ddbeb582SStefano Zampini } 2186c69f721fSFande Kong 2187d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view) 2188d71ae5a4SJacob Faibussowitsch { 218945b8d346SStefano Zampini PetscViewerFormat format; 219045b8d346SStefano Zampini 219145b8d346SStefano Zampini PetscFunctionBegin; 21929566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(view, &format)); 21933ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 219445b8d346SStefano Zampini if (format != PETSC_VIEWER_NATIVE) { 21956ea7df73SStefano Zampini Mat B; 21966ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 21976ea7df73SStefano Zampini PetscErrorCode (*mview)(Mat, PetscViewer) = NULL; 21986ea7df73SStefano Zampini 21999566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 22009566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(parcsr, MATAIJ, PETSC_USE_POINTER, &B)); 220157d50842SBarry Smith PetscCall(MatGetOperation(B, MATOP_VIEW, (PetscErrorCodeFn **)&mview)); 220228b400f6SJacob Faibussowitsch PetscCheck(mview, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Missing view operation"); 22039566063dSJacob Faibussowitsch PetscCall((*mview)(B, view)); 22049566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 220545b8d346SStefano Zampini } else { 220645b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 220745b8d346SStefano Zampini PetscMPIInt size; 220845b8d346SStefano Zampini PetscBool isascii; 220945b8d346SStefano Zampini const char *filename; 221045b8d346SStefano Zampini 
221145b8d346SStefano Zampini /* HYPRE uses only text files */ 22129566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)view, PETSCVIEWERASCII, &isascii)); 221328b400f6SJacob Faibussowitsch PetscCheck(isascii, PetscObjectComm((PetscObject)view), PETSC_ERR_SUP, "PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII", ((PetscObject)view)->type_name); 22149566063dSJacob Faibussowitsch PetscCall(PetscViewerFileGetName(view, &filename)); 2215a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixPrint(hA->ij, filename)); 22169566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(hA->comm, &size)); 221745b8d346SStefano Zampini if (size > 1) { 22189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view, "Matrix files: %s.%05d ... %s.%05d\n", filename, 0, filename, size - 1)); 221945b8d346SStefano Zampini } else { 22209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view, "Matrix file: %s.%05d\n", filename, 0)); 222145b8d346SStefano Zampini } 222245b8d346SStefano Zampini } 22233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 222445b8d346SStefano Zampini } 222545b8d346SStefano Zampini 2226d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str) 2227d71ae5a4SJacob Faibussowitsch { 2228465edc17SStefano Zampini hypre_ParCSRMatrix *acsr, *bcsr; 2229465edc17SStefano Zampini 2230465edc17SStefano Zampini PetscFunctionBegin; 2231465edc17SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 22329566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &acsr)); 22339566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(B, &bcsr)); 2234a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixCopy(acsr, bcsr, 1)); 22359566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 22369566063dSJacob Faibussowitsch 
PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 22379566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 2238465edc17SStefano Zampini } else { 22399566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2240465edc17SStefano Zampini } 22413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2242465edc17SStefano Zampini } 2243465edc17SStefano Zampini 2244d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d) 2245d71ae5a4SJacob Faibussowitsch { 22466305df00SStefano Zampini hypre_ParCSRMatrix *parcsr; 22476305df00SStefano Zampini hypre_CSRMatrix *dmat; 224839accc25SStefano Zampini HYPRE_Complex *a; 22496305df00SStefano Zampini PetscBool cong; 22506305df00SStefano Zampini 22516305df00SStefano Zampini PetscFunctionBegin; 22529566063dSJacob Faibussowitsch PetscCall(MatHasCongruentLayouts(A, &cong)); 225328b400f6SJacob Faibussowitsch PetscCheck(cong, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only for square matrices with same local distributions of rows and columns"); 22549566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 22556305df00SStefano Zampini dmat = hypre_ParCSRMatrixDiag(parcsr); 22566305df00SStefano Zampini if (dmat) { 225706977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 225806977982Sstefanozampini HYPRE_MemoryLocation mem = hypre_CSRMatrixMemoryLocation(dmat); 225906977982Sstefanozampini #else 226006977982Sstefanozampini HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST; 226106977982Sstefanozampini #endif 226206977982Sstefanozampini 226306977982Sstefanozampini if (mem != HYPRE_MEMORY_HOST) PetscCall(VecGetArrayWriteAndMemType(d, (PetscScalar **)&a, NULL)); 226406977982Sstefanozampini else PetscCall(VecGetArrayWrite(d, (PetscScalar **)&a)); 226506977982Sstefanozampini hypre_CSRMatrixExtractDiagonal(dmat, a, 0); 226606977982Sstefanozampini if (mem != HYPRE_MEMORY_HOST) PetscCall(VecRestoreArrayWriteAndMemType(d, (PetscScalar **)&a)); 
226706977982Sstefanozampini else PetscCall(VecRestoreArrayWrite(d, (PetscScalar **)&a)); 22686305df00SStefano Zampini } 22693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22706305df00SStefano Zampini } 22716305df00SStefano Zampini 2272363d496dSStefano Zampini #include <petscblaslapack.h> 2273363d496dSStefano Zampini 2274d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAXPY_HYPRE(Mat Y, PetscScalar a, Mat X, MatStructure str) 2275d71ae5a4SJacob Faibussowitsch { 2276363d496dSStefano Zampini PetscFunctionBegin; 22776ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 22786ea7df73SStefano Zampini { 22796ea7df73SStefano Zampini Mat B; 22806ea7df73SStefano Zampini hypre_ParCSRMatrix *x, *y, *z; 22816ea7df73SStefano Zampini 22829566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y, &y)); 22839566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X, &x)); 2284a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixAdd(1.0, y, 1.0, x, &z)); 22859566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(z, MATHYPRE, PETSC_OWN_POINTER, &B)); 22869566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 22876ea7df73SStefano Zampini } 22886ea7df73SStefano Zampini #else 2289363d496dSStefano Zampini if (str == SAME_NONZERO_PATTERN) { 2290363d496dSStefano Zampini hypre_ParCSRMatrix *x, *y; 2291363d496dSStefano Zampini hypre_CSRMatrix *xloc, *yloc; 2292363d496dSStefano Zampini PetscInt xnnz, ynnz; 229339accc25SStefano Zampini HYPRE_Complex *xarr, *yarr; 2294363d496dSStefano Zampini PetscBLASInt one = 1, bnz; 2295363d496dSStefano Zampini 22969566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y, &y)); 22979566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X, &x)); 2298363d496dSStefano Zampini 2299363d496dSStefano Zampini /* diagonal block */ 2300363d496dSStefano Zampini xloc = hypre_ParCSRMatrixDiag(x); 2301363d496dSStefano Zampini yloc = hypre_ParCSRMatrixDiag(y); 2302363d496dSStefano Zampini xnnz = 0; 
2303363d496dSStefano Zampini ynnz = 0; 2304363d496dSStefano Zampini xarr = NULL; 2305363d496dSStefano Zampini yarr = NULL; 2306363d496dSStefano Zampini if (xloc) { 230739accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2308363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2309363d496dSStefano Zampini } 2310363d496dSStefano Zampini if (yloc) { 231139accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2312363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2313363d496dSStefano Zampini } 231408401ef6SPierre Jolivet PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz); 23159566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz, &bnz)); 2316792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one)); 2317363d496dSStefano Zampini 2318363d496dSStefano Zampini /* off-diagonal block */ 2319363d496dSStefano Zampini xloc = hypre_ParCSRMatrixOffd(x); 2320363d496dSStefano Zampini yloc = hypre_ParCSRMatrixOffd(y); 2321363d496dSStefano Zampini xnnz = 0; 2322363d496dSStefano Zampini ynnz = 0; 2323363d496dSStefano Zampini xarr = NULL; 2324363d496dSStefano Zampini yarr = NULL; 2325363d496dSStefano Zampini if (xloc) { 232639accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2327363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2328363d496dSStefano Zampini } 2329363d496dSStefano Zampini if (yloc) { 233039accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2331363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2332363d496dSStefano Zampini } 233308401ef6SPierre Jolivet PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz); 23349566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz, &bnz)); 2335792fecdfSBarry 
Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one)); 2336363d496dSStefano Zampini } else if (str == SUBSET_NONZERO_PATTERN) { 23379566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 2338363d496dSStefano Zampini } else { 2339363d496dSStefano Zampini Mat B; 2340363d496dSStefano Zampini 23419566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic_Preallocate(Y, X, &B)); 23429566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 23439566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(Y, &B)); 2344363d496dSStefano Zampini } 23456ea7df73SStefano Zampini #endif 23463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2347363d496dSStefano Zampini } 2348363d496dSStefano Zampini 23492c4ab24aSJunchao Zhang static PetscErrorCode MatDuplicate_HYPRE(Mat A, MatDuplicateOption op, Mat *B) 23502c4ab24aSJunchao Zhang { 23512c4ab24aSJunchao Zhang hypre_ParCSRMatrix *parcsr = NULL; 23522c4ab24aSJunchao Zhang PetscCopyMode cpmode; 23532c4ab24aSJunchao Zhang Mat_HYPRE *hA; 23542c4ab24aSJunchao Zhang 23552c4ab24aSJunchao Zhang PetscFunctionBegin; 23562c4ab24aSJunchao Zhang PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 23572c4ab24aSJunchao Zhang if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) { 23582c4ab24aSJunchao Zhang parcsr = hypre_ParCSRMatrixClone(parcsr, 0); 23592c4ab24aSJunchao Zhang cpmode = PETSC_OWN_POINTER; 23602c4ab24aSJunchao Zhang } else { 23612c4ab24aSJunchao Zhang cpmode = PETSC_COPY_VALUES; 23622c4ab24aSJunchao Zhang } 23632c4ab24aSJunchao Zhang PetscCall(MatCreateFromParCSR(parcsr, MATHYPRE, cpmode, B)); 23642c4ab24aSJunchao Zhang hA = (Mat_HYPRE *)A->data; 23652c4ab24aSJunchao Zhang if (hA->cooMat) { 236606977982Sstefanozampini Mat_HYPRE *hB = (Mat_HYPRE *)((*B)->data); 2367b73e3080SStefano Zampini op = (op == MAT_DO_NOT_COPY_VALUES) ? 
op : MAT_COPY_VALUES; 2368b73e3080SStefano Zampini /* Cannot simply increase the reference count of hA->cooMat, since B needs to share cooMat's data array */ 236906977982Sstefanozampini PetscCall(MatDuplicate(hA->cooMat, op, &hB->cooMat)); 237006977982Sstefanozampini PetscCall(MatHYPRE_AttachCOOMat(*B)); 23712c4ab24aSJunchao Zhang } 23722c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 23732c4ab24aSJunchao Zhang } 23742c4ab24aSJunchao Zhang 2375d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetPreallocationCOO_HYPRE(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 2376d71ae5a4SJacob Faibussowitsch { 237706977982Sstefanozampini Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data; 23785fbaff96SJunchao Zhang 23795fbaff96SJunchao Zhang PetscFunctionBegin; 2380651b1cf9SStefano Zampini /* Build an agent matrix cooMat with AIJ format 23815fbaff96SJunchao Zhang It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work. 
23825fbaff96SJunchao Zhang */ 238306977982Sstefanozampini PetscCall(MatHYPRE_CreateCOOMat(mat)); 238406977982Sstefanozampini PetscCall(MatSetOption(hmat->cooMat, MAT_IGNORE_OFF_PROC_ENTRIES, hmat->donotstash)); 238506977982Sstefanozampini PetscCall(MatSetOption(hmat->cooMat, MAT_NO_OFF_PROC_ENTRIES, mat->nooffprocentries)); 2386651b1cf9SStefano Zampini 2387651b1cf9SStefano Zampini /* MatSetPreallocationCOO_SeqAIJ and MatSetPreallocationCOO_MPIAIJ uses this specific 2388651b1cf9SStefano Zampini name to automatically put the diagonal entries first */ 238906977982Sstefanozampini PetscCall(PetscObjectSetName((PetscObject)hmat->cooMat, "_internal_COO_mat_for_hypre")); 239006977982Sstefanozampini PetscCall(MatSetPreallocationCOO(hmat->cooMat, coo_n, coo_i, coo_j)); 239106977982Sstefanozampini hmat->cooMat->assembled = PETSC_TRUE; 23925fbaff96SJunchao Zhang 23935fbaff96SJunchao Zhang /* Copy the sparsity pattern from cooMat to hypre IJMatrix hmat->ij */ 23945fbaff96SJunchao Zhang PetscCall(MatSetOption(mat, MAT_SORTED_FULL, PETSC_TRUE)); 239506977982Sstefanozampini PetscCall(MatHYPRE_CreateFromMat(hmat->cooMat, hmat)); /* Create hmat->ij and preallocate it */ 239606977982Sstefanozampini PetscCall(MatHYPRE_IJMatrixCopyIJ(hmat->cooMat, hmat->ij)); /* Copy A's (i,j) to hmat->ij */ 23975fbaff96SJunchao Zhang 23985fbaff96SJunchao Zhang mat->preallocated = PETSC_TRUE; 23995fbaff96SJunchao Zhang PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 24005fbaff96SJunchao Zhang PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); /* Migrate mat to device if it is bound to. 
Hypre builds its own SpMV context here */ 24015fbaff96SJunchao Zhang 24022c4ab24aSJunchao Zhang /* Attach cooMat to mat */ 240306977982Sstefanozampini PetscCall(MatHYPRE_AttachCOOMat(mat)); 24043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24055fbaff96SJunchao Zhang } 24065fbaff96SJunchao Zhang 2407d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_HYPRE(Mat mat, const PetscScalar v[], InsertMode imode) 2408d71ae5a4SJacob Faibussowitsch { 24095fbaff96SJunchao Zhang Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data; 24105fbaff96SJunchao Zhang 24115fbaff96SJunchao Zhang PetscFunctionBegin; 2412b73e3080SStefano Zampini PetscCheck(hmat->cooMat, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet"); 24135fbaff96SJunchao Zhang PetscCall(MatSetValuesCOO(hmat->cooMat, v, imode)); 2414651b1cf9SStefano Zampini PetscCall(MatViewFromOptions(hmat->cooMat, (PetscObject)mat, "-cooMat_view")); 24153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24165fbaff96SJunchao Zhang } 24175fbaff96SJunchao Zhang 241803db1824SAlex Lindsay static PetscErrorCode MatGetCurrentMemType_HYPRE(Mat A, PetscMemType *m) 241903db1824SAlex Lindsay { 242003db1824SAlex Lindsay PetscBool petsconcpu; 242103db1824SAlex Lindsay 242203db1824SAlex Lindsay PetscFunctionBegin; 242303db1824SAlex Lindsay PetscCall(MatBoundToCPU(A, &petsconcpu)); 242403db1824SAlex Lindsay *m = petsconcpu ? PETSC_MEMTYPE_HOST : PETSC_MEMTYPE_DEVICE; 242503db1824SAlex Lindsay PetscFunctionReturn(PETSC_SUCCESS); 242603db1824SAlex Lindsay } 242703db1824SAlex Lindsay 2428a055b5aaSBarry Smith /*MC 24292ef1f0ffSBarry Smith MATHYPRE - "hypre" - A matrix type to be used for sequential and parallel sparse matrices 2430a055b5aaSBarry Smith based on the hypre IJ interface. 
2431a055b5aaSBarry Smith 2432a055b5aaSBarry Smith Level: intermediate 2433a055b5aaSBarry Smith 24341cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatHYPRESetPreallocation` 2435a055b5aaSBarry Smith M*/ 2436d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B) 2437d71ae5a4SJacob Faibussowitsch { 243863c07aadSStefano Zampini Mat_HYPRE *hB; 2439a9e6c71bSAlex Lindsay #if defined(PETSC_HAVE_HYPRE_DEVICE) 2440a9e6c71bSAlex Lindsay HYPRE_MemoryLocation memory_location; 2441a9e6c71bSAlex Lindsay #endif 244263c07aadSStefano Zampini 244363c07aadSStefano Zampini PetscFunctionBegin; 2444a9e6c71bSAlex Lindsay PetscHYPREInitialize(); 24454dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&hB)); 24466ea7df73SStefano Zampini 2447978814f1SStefano Zampini hB->inner_free = PETSC_TRUE; 2448651b1cf9SStefano Zampini hB->array_available = PETSC_TRUE; 2449978814f1SStefano Zampini 245063c07aadSStefano Zampini B->data = (void *)hB; 245163c07aadSStefano Zampini 24529566063dSJacob Faibussowitsch PetscCall(PetscMemzero(B->ops, sizeof(struct _MatOps))); 245363c07aadSStefano Zampini B->ops->mult = MatMult_HYPRE; 245463c07aadSStefano Zampini B->ops->multtranspose = MatMultTranspose_HYPRE; 2455414bd5c3SStefano Zampini B->ops->multadd = MatMultAdd_HYPRE; 2456414bd5c3SStefano Zampini B->ops->multtransposeadd = MatMultTransposeAdd_HYPRE; 245763c07aadSStefano Zampini B->ops->setup = MatSetUp_HYPRE; 245863c07aadSStefano Zampini B->ops->destroy = MatDestroy_HYPRE; 245963c07aadSStefano Zampini B->ops->assemblyend = MatAssemblyEnd_HYPRE; 2460c69f721fSFande Kong B->ops->assemblybegin = MatAssemblyBegin_HYPRE; 2461d975228cSstefano_zampini B->ops->setvalues = MatSetValues_HYPRE; 246268ec7858SStefano Zampini B->ops->missingdiagonal = MatMissingDiagonal_HYPRE; 246368ec7858SStefano Zampini B->ops->scale = MatScale_HYPRE; 246468ec7858SStefano Zampini B->ops->zerorowscolumns = MatZeroRowsColumns_HYPRE; 2465c69f721fSFande Kong B->ops->zeroentries = 
MatZeroEntries_HYPRE; 2466c69f721fSFande Kong B->ops->zerorows = MatZeroRows_HYPRE; 2467c69f721fSFande Kong B->ops->getrow = MatGetRow_HYPRE; 2468c69f721fSFande Kong B->ops->restorerow = MatRestoreRow_HYPRE; 2469c69f721fSFande Kong B->ops->getvalues = MatGetValues_HYPRE; 2470ddbeb582SStefano Zampini B->ops->setoption = MatSetOption_HYPRE; 247145b8d346SStefano Zampini B->ops->duplicate = MatDuplicate_HYPRE; 2472465edc17SStefano Zampini B->ops->copy = MatCopy_HYPRE; 247345b8d346SStefano Zampini B->ops->view = MatView_HYPRE; 24746305df00SStefano Zampini B->ops->getdiagonal = MatGetDiagonal_HYPRE; 2475363d496dSStefano Zampini B->ops->axpy = MatAXPY_HYPRE; 24764222ddf1SHong Zhang B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE; 247703db1824SAlex Lindsay B->ops->getcurrentmemtype = MatGetCurrentMemType_HYPRE; 24786ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 24796ea7df73SStefano Zampini B->ops->bindtocpu = MatBindToCPU_HYPRE; 2480a9e6c71bSAlex Lindsay /* Get hypre's default memory location. Users can control this using the corresponding HYPRE_SetMemoryLocation API */ 2481a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_GetMemoryLocation(&memory_location)); 2482a9e6c71bSAlex Lindsay B->boundtocpu = (memory_location == HYPRE_MEMORY_HOST) ? 
PETSC_TRUE : PETSC_FALSE; 24836ea7df73SStefano Zampini #endif 248445b8d346SStefano Zampini 248545b8d346SStefano Zampini /* build cache for off array entries formed */ 24869566063dSJacob Faibussowitsch PetscCall(MatStashCreate_Private(PetscObjectComm((PetscObject)B), 1, &B->stash)); 248763c07aadSStefano Zampini 24889566063dSJacob Faibussowitsch PetscCall(PetscCommGetComm(PetscObjectComm((PetscObject)B), &hB->comm)); 24899566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATHYPRE)); 24909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_aij_C", MatConvert_HYPRE_AIJ)); 24919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_is_C", MatConvert_HYPRE_IS)); 24929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_hypre_C", MatProductSetFromOptions_HYPRE)); 24939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaij_hypre_C", MatProductSetFromOptions_HYPRE)); 24949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPRESetPreallocation_C", MatHYPRESetPreallocation_HYPRE)); 24959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPREGetParCSR_C", MatHYPREGetParCSR_HYPRE)); 24965fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_HYPRE)); 24975fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_HYPRE)); 24986ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 24996ea7df73SStefano Zampini #if defined(HYPRE_USING_HIP) 250006977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_hypre_C", MatProductSetFromOptions_HYPRE)); 250106977982Sstefanozampini 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaijhipsparse_hypre_C", MatProductSetFromOptions_HYPRE)); 25029566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_HIP)); 25039566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B, VECHIP)); 25046ea7df73SStefano Zampini #endif 25056ea7df73SStefano Zampini #if defined(HYPRE_USING_CUDA) 250606977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_hypre_C", MatProductSetFromOptions_HYPRE)); 250706977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaijcusparse_hypre_C", MatProductSetFromOptions_HYPRE)); 25089566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_CUDA)); 25099566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B, VECCUDA)); 25106ea7df73SStefano Zampini #endif 25116ea7df73SStefano Zampini #endif 25123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 251363c07aadSStefano Zampini } 2514