163c07aadSStefano Zampini 263c07aadSStefano Zampini /* 363c07aadSStefano Zampini Creates hypre ijmatrix from PETSc matrix 463c07aadSStefano Zampini */ 5225daaf8SStefano Zampini 6c6698e78SStefano Zampini #include <petscpkg_version.h> 739accc25SStefano Zampini #include <petsc/private/petschypre.h> 8dd9c0a25Sstefano_zampini #include <petscmathypre.h> 963c07aadSStefano Zampini #include <petsc/private/matimpl.h> 10a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h> 1163c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h> 1263c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h> 1358968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h> 1458968eb6SStefano Zampini #include <HYPRE.h> 15c1a070e6SStefano Zampini #include <HYPRE_utilities.h> 16cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h> 1768ec7858SStefano Zampini #include <_hypre_sstruct_ls.h> 1863c07aadSStefano Zampini 190e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 200e6427aaSSatish Balay #define hypre_ParCSRMatrixClone(A, B) hypre_ParCSRMatrixCompleteClone(A) 210e6427aaSSatish Balay #endif 220e6427aaSSatish Balay 2363c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat, Mat_HYPRE *); 2463c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat, Mat, HYPRE_IJMatrix); 2563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat, HYPRE_IJMatrix); 2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat, HYPRE_IJMatrix); 2739accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat, HYPRE_Complex, Vec, HYPRE_Complex, Vec, PetscBool); 28225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void *); 296ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[], const PetscScalar[], InsertMode ins); 3063c07aadSStefano Zampini 31d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij) 32d71ae5a4SJacob Faibussowitsch { 3363c07aadSStefano Zampini PetscInt i, n_d, n_o; 3463c07aadSStefano Zampini const PetscInt *ia_d, *ia_o; 3563c07aadSStefano Zampini PetscBool done_d = PETSC_FALSE, done_o = PETSC_FALSE; 362cf14000SStefano Zampini HYPRE_Int *nnz_d = NULL, *nnz_o = NULL; 3763c07aadSStefano Zampini 3863c07aadSStefano Zampini PetscFunctionBegin; 3963c07aadSStefano Zampini if (A_d) { /* determine number of nonzero entries in local diagonal part */ 409566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, &n_d, &ia_d, NULL, &done_d)); 4163c07aadSStefano Zampini if (done_d) { 429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_d, &nnz_d)); 43ad540459SPierre Jolivet for (i = 0; i < n_d; i++) nnz_d[i] = ia_d[i + 1] - ia_d[i]; 4463c07aadSStefano Zampini } 459566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, NULL, &ia_d, NULL, &done_d)); 4663c07aadSStefano Zampini } 4763c07aadSStefano Zampini if (A_o) { /* determine number of nonzero entries in local off-diagonal part */ 489566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o)); 4963c07aadSStefano Zampini if (done_o) { 509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_o, &nnz_o)); 51ad540459SPierre Jolivet for (i = 0; i < n_o; i++) nnz_o[i] = ia_o[i + 1] - ia_o[i]; 5263c07aadSStefano Zampini } 539566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o)); 5463c07aadSStefano Zampini } 5563c07aadSStefano Zampini if (done_d) { /* set number of nonzeros in HYPRE IJ matrix */ 5663c07aadSStefano Zampini if (!done_o) { /* only diagonal part */ 579566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n_d, &nnz_o)); 5863c07aadSStefano Zampini } 59c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 60c6698e78SStefano Zampini { /* If we don't do this, the columns of the matrix will be all zeros! */ 61c6698e78SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 62c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 63c6698e78SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 64c6698e78SStefano Zampini hypre_IJMatrixTranslator(ij) = NULL; 65792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, ij, nnz_d, nnz_o); 6622235d61SPierre Jolivet /* it seems they partially fixed it in 2.19.0 */ 6722235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 68c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 69c6698e78SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; 7022235d61SPierre Jolivet #endif 71c6698e78SStefano Zampini } 72c6698e78SStefano Zampini #else 73792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, ij, nnz_d, nnz_o); 74c6698e78SStefano Zampini #endif 759566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_d)); 769566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_o)); 7763c07aadSStefano Zampini } 783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7963c07aadSStefano Zampini } 8063c07aadSStefano Zampini 81d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA) 82d71ae5a4SJacob Faibussowitsch { 8363c07aadSStefano Zampini PetscInt rstart, rend, cstart, cend; 8463c07aadSStefano Zampini 8563c07aadSStefano Zampini PetscFunctionBegin; 869566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 879566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 8863c07aadSStefano Zampini rstart = A->rmap->rstart; 8963c07aadSStefano Zampini rend = A->rmap->rend; 9063c07aadSStefano Zampini cstart = A->cmap->rstart; 9163c07aadSStefano Zampini cend = A->cmap->rend; 92792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij); 93792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR); 9463c07aadSStefano Zampini { 9563c07aadSStefano Zampini PetscBool same; 9663c07aadSStefano Zampini Mat A_d, A_o; 9763c07aadSStefano Zampini const PetscInt *colmap; 989566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &same)); 9963c07aadSStefano Zampini if (same) { 1009566063dSJacob Faibussowitsch PetscCall(MatMPIAIJGetSeqAIJ(A, &A_d, &A_o, &colmap)); 1019566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij)); 1023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10363c07aadSStefano Zampini } 1049566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIBAIJ, &same)); 10563c07aadSStefano Zampini if (same) { 1069566063dSJacob Faibussowitsch PetscCall(MatMPIBAIJGetSeqBAIJ(A, &A_d, &A_o, &colmap)); 1079566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij)); 1083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10963c07aadSStefano Zampini } 1109566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &same)); 11163c07aadSStefano Zampini if (same) { 1129566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij)); 1133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11463c07aadSStefano Zampini } 1159566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQBAIJ, &same)); 11663c07aadSStefano Zampini if (same) { 1179566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij)); 1183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11963c07aadSStefano Zampini } 12063c07aadSStefano Zampini } 1213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12263c07aadSStefano Zampini } 12363c07aadSStefano Zampini 124d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixCopy(Mat A, HYPRE_IJMatrix ij) 125d71ae5a4SJacob Faibussowitsch { 12663c07aadSStefano Zampini PetscInt i, rstart, rend, ncols, nr, nc; 12763c07aadSStefano Zampini const PetscScalar *values; 12863c07aadSStefano Zampini const PetscInt *cols; 12963c07aadSStefano Zampini PetscBool flg; 13063c07aadSStefano Zampini 13163c07aadSStefano Zampini PetscFunctionBegin; 1326ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 133792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize, ij); 1346ea7df73SStefano Zampini #else 135792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize_v2, ij, HYPRE_MEMORY_HOST); 1366ea7df73SStefano Zampini #endif 1379566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &flg)); 1389566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &nr, &nc)); 13963c07aadSStefano Zampini if (flg && nr == nc) { 1409566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixFastCopy_MPIAIJ(A, ij)); 1413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14263c07aadSStefano Zampini } 1439566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &flg)); 14463c07aadSStefano Zampini if (flg) { 1459566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixFastCopy_SeqAIJ(A, ij)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14763c07aadSStefano Zampini } 14863c07aadSStefano Zampini 1495fbaff96SJunchao Zhang /* Do not need Aux since we have done precise i[],j[] allocation in MatHYPRE_CreateFromMat() */ 1505fbaff96SJunchao Zhang hypre_AuxParCSRMatrixNeedAux((hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij)) = 0; 1515fbaff96SJunchao Zhang 1529566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rstart, &rend)); 15363c07aadSStefano Zampini for (i = rstart; i < rend; i++) { 1549566063dSJacob Faibussowitsch PetscCall(MatGetRow(A, i, &ncols, &cols, &values)); 155e3977e59Sstefano_zampini if (ncols) { 1562cf14000SStefano Zampini HYPRE_Int nc = (HYPRE_Int)ncols; 1572cf14000SStefano Zampini 158aed4548fSBarry Smith PetscCheck((PetscInt)nc == ncols, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, ncols, i); 159792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetValues, ij, 1, &nc, (HYPRE_BigInt *)&i, (HYPRE_BigInt *)cols, (HYPRE_Complex *)values); 160e3977e59Sstefano_zampini } 1619566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(A, i, &ncols, &cols, &values)); 16263c07aadSStefano Zampini } 1633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16463c07aadSStefano Zampini } 16563c07aadSStefano Zampini 166d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat A, HYPRE_IJMatrix ij) 167d71ae5a4SJacob Faibussowitsch { 16863c07aadSStefano Zampini Mat_SeqAIJ *pdiag = (Mat_SeqAIJ *)A->data; 16958968eb6SStefano Zampini HYPRE_Int type; 17063c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 17163c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 17263c07aadSStefano Zampini hypre_CSRMatrix *hdiag; 1732cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 1746ea7df73SStefano Zampini const PetscScalar *pa; 17563c07aadSStefano Zampini 17663c07aadSStefano Zampini PetscFunctionBegin; 177792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, ij, &type); 17808401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 179792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, ij, (void **)&par_matrix); 18063c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 18163c07aadSStefano Zampini /* 18263c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 18363c07aadSStefano Zampini */ 1842cf14000SStefano Zampini if (sameint) { 1859566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i, pdiag->i, A->rmap->n + 1)); 1869566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->j, pdiag->j, pdiag->nz)); 1872cf14000SStefano Zampini } else { 1882cf14000SStefano Zampini PetscInt i; 1892cf14000SStefano Zampini 1902cf14000SStefano Zampini for (i = 0; i < A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i]; 1912cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hdiag->j[i] = (HYPRE_Int)pdiag->j[i]; 1922cf14000SStefano Zampini } 1936ea7df73SStefano Zampini 1949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &pa)); 1959566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->data, pa, pdiag->nz)); 1969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &pa)); 197ea9daf28SStefano Zampini 198ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 19963c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 2003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20163c07aadSStefano Zampini } 20263c07aadSStefano Zampini 203d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat A, HYPRE_IJMatrix ij) 204d71ae5a4SJacob Faibussowitsch { 20563c07aadSStefano Zampini Mat_MPIAIJ *pA = (Mat_MPIAIJ *)A->data; 20663c07aadSStefano Zampini Mat_SeqAIJ *pdiag, *poffd; 20763c07aadSStefano Zampini PetscInt i, *garray = pA->garray, *jj, cstart, *pjj; 2082cf14000SStefano Zampini HYPRE_Int *hjj, type; 20963c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 21063c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 21163c07aadSStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 2122cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 2136ea7df73SStefano Zampini const PetscScalar *pa; 21463c07aadSStefano Zampini 21563c07aadSStefano Zampini PetscFunctionBegin; 21663c07aadSStefano Zampini pdiag = (Mat_SeqAIJ *)pA->A->data; 21763c07aadSStefano Zampini poffd = (Mat_SeqAIJ *)pA->B->data; 218da81f932SPierre Jolivet /* cstart is only valid for square MPIAIJ laid out in the usual way */ 2199566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &cstart, NULL)); 22063c07aadSStefano Zampini 221792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, ij, &type); 22208401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 223792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, ij, (void **)&par_matrix); 22463c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 22563c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(par_matrix); 22663c07aadSStefano Zampini 22763c07aadSStefano Zampini /* 22863c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 22963c07aadSStefano Zampini */ 2302cf14000SStefano Zampini if (sameint) { 2319566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i, pdiag->i, pA->A->rmap->n + 1)); 2322cf14000SStefano Zampini } else { 2332cf14000SStefano Zampini for (i = 0; i < pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)(pdiag->i[i]); 2342cf14000SStefano Zampini } 23563c07aadSStefano Zampini /* need to shift the diag column indices (hdiag->j) back to global numbering since hypre is expecting this */ 2362cf14000SStefano Zampini hjj = hdiag->j; 2372cf14000SStefano Zampini pjj = pdiag->j; 238c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 2392cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hjj[i] = pjj[i]; 240c6698e78SStefano Zampini #else 2412cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hjj[i] = cstart + pjj[i]; 242c6698e78SStefano Zampini #endif 2439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(pA->A, &pa)); 2449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->data, pa, pdiag->nz)); 2459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(pA->A, &pa)); 2462cf14000SStefano Zampini if (sameint) { 2479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hoffd->i, poffd->i, pA->A->rmap->n + 1)); 2482cf14000SStefano Zampini } else { 2492cf14000SStefano Zampini for (i = 0; i < pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)(poffd->i[i]); 2502cf14000SStefano Zampini } 2512cf14000SStefano Zampini 25263c07aadSStefano Zampini /* need to move the offd column indices (hoffd->j) back to global numbering since hypre is expecting this 25363c07aadSStefano Zampini If we hacked a hypre a bit more we might be able to avoid this step */ 254c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 255792fecdfSBarry Smith PetscCallExternal(hypre_CSRMatrixBigInitialize, hoffd); 256c6698e78SStefano Zampini jj = (PetscInt *)hoffd->big_j; 257c6698e78SStefano Zampini #else 25863c07aadSStefano Zampini jj = (PetscInt *)hoffd->j; 259c6698e78SStefano Zampini #endif 2602cf14000SStefano Zampini pjj = poffd->j; 26163c07aadSStefano Zampini for (i = 0; i < poffd->nz; i++) jj[i] = garray[pjj[i]]; 262c6698e78SStefano Zampini 2639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(pA->B, &pa)); 2649566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hoffd->data, pa, poffd->nz)); 2659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(pA->B, &pa)); 26663c07aadSStefano Zampini 267ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 26863c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 2693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 27063c07aadSStefano Zampini } 27163c07aadSStefano Zampini 272d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat *B) 273d71ae5a4SJacob Faibussowitsch { 2742df22349SStefano Zampini Mat_HYPRE *mhA = (Mat_HYPRE *)(A->data); 2752df22349SStefano Zampini Mat lA; 2762df22349SStefano Zampini ISLocalToGlobalMapping rl2g, cl2g; 2772df22349SStefano Zampini IS is; 2782df22349SStefano Zampini hypre_ParCSRMatrix *hA; 2792df22349SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 2802df22349SStefano Zampini MPI_Comm comm; 28139accc25SStefano Zampini HYPRE_Complex *hdd, *hod, *aa; 28239accc25SStefano Zampini PetscScalar *data; 2832cf14000SStefano Zampini HYPRE_BigInt *col_map_offd; 2842cf14000SStefano Zampini HYPRE_Int *hdi, *hdj, *hoi, *hoj; 2852df22349SStefano Zampini PetscInt *ii, *jj, *iptr, *jptr; 2862df22349SStefano Zampini PetscInt cum, dr, dc, oc, str, stc, nnz, i, jd, jo, M, N; 28758968eb6SStefano Zampini HYPRE_Int type; 2882df22349SStefano Zampini 2892df22349SStefano Zampini PetscFunctionBegin; 290a1787963SStefano Zampini comm = PetscObjectComm((PetscObject)A); 291792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, mhA->ij, &type); 29208401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 293792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, mhA->ij, (void **)&hA); 2942df22349SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(hA); 2952df22349SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(hA); 2962df22349SStefano Zampini str = hypre_ParCSRMatrixFirstRowIndex(hA); 2972df22349SStefano Zampini stc = hypre_ParCSRMatrixFirstColDiag(hA); 2982df22349SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(hA); 2992df22349SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(hA); 3002df22349SStefano Zampini dr = hypre_CSRMatrixNumRows(hdiag); 3012df22349SStefano Zampini dc = hypre_CSRMatrixNumCols(hdiag); 3022df22349SStefano Zampini nnz = hypre_CSRMatrixNumNonzeros(hdiag); 3032df22349SStefano Zampini hdi = hypre_CSRMatrixI(hdiag); 3042df22349SStefano Zampini hdj = hypre_CSRMatrixJ(hdiag); 3052df22349SStefano Zampini hdd = hypre_CSRMatrixData(hdiag); 3062df22349SStefano Zampini oc = hypre_CSRMatrixNumCols(hoffd); 3072df22349SStefano Zampini nnz += hypre_CSRMatrixNumNonzeros(hoffd); 3082df22349SStefano Zampini hoi = hypre_CSRMatrixI(hoffd); 3092df22349SStefano Zampini hoj = hypre_CSRMatrixJ(hoffd); 3102df22349SStefano Zampini hod = hypre_CSRMatrixData(hoffd); 3112df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 3122df22349SStefano Zampini PetscInt *aux; 3132df22349SStefano Zampini 3142df22349SStefano Zampini /* generate l2g maps for rows and cols */ 3159566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, dr, str, 1, &is)); 3169566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is, &rl2g)); 3179566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 3182df22349SStefano Zampini col_map_offd = hypre_ParCSRMatrixColMapOffd(hA); 3199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dc + oc, &aux)); 3202df22349SStefano Zampini for (i = 0; i < dc; i++) aux[i] = i + stc; 3212df22349SStefano Zampini for (i = 0; i < oc; i++) aux[i + dc] = col_map_offd[i]; 3229566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(comm, dc + oc, aux, PETSC_OWN_POINTER, &is)); 3239566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is, &cl2g)); 3249566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 3252df22349SStefano Zampini /* create MATIS object */ 3269566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, B)); 3279566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, dr, dc, M, N)); 3289566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATIS)); 3299566063dSJacob Faibussowitsch PetscCall(MatSetLocalToGlobalMapping(*B, rl2g, cl2g)); 3309566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&rl2g)); 3319566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&cl2g)); 3322df22349SStefano Zampini 3332df22349SStefano Zampini /* allocate CSR for local matrix */ 3349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dr + 1, &iptr)); 3359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &jptr)); 3369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &data)); 3372df22349SStefano Zampini } else { 3382df22349SStefano Zampini PetscInt nr; 3392df22349SStefano Zampini PetscBool done; 3409566063dSJacob Faibussowitsch PetscCall(MatISGetLocalMat(*B, &lA)); 3419566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(lA, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&iptr, (const PetscInt **)&jptr, &done)); 34208401ef6SPierre Jolivet PetscCheck(nr == dr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT, nr, dr); 34308401ef6SPierre Jolivet PetscCheck(iptr[nr] >= nnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in local mat! reuse %" PetscInt_FMT " requested %" PetscInt_FMT, iptr[nr], nnz); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(lA, &data)); 3452df22349SStefano Zampini } 3462df22349SStefano Zampini /* merge local matrices */ 3472df22349SStefano Zampini ii = iptr; 3482df22349SStefano Zampini jj = jptr; 34939accc25SStefano Zampini aa = (HYPRE_Complex *)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 3502df22349SStefano Zampini *ii = *(hdi++) + *(hoi++); 3512df22349SStefano Zampini for (jd = 0, jo = 0, cum = 0; *ii < nnz; cum++) { 35239accc25SStefano Zampini PetscScalar *aold = (PetscScalar *)aa; 3532df22349SStefano Zampini PetscInt *jold = jj, nc = jd + jo; 3549371c9d4SSatish Balay for (; jd < *hdi; jd++) { 3559371c9d4SSatish Balay *jj++ = *hdj++; 3569371c9d4SSatish Balay *aa++ = *hdd++; 3579371c9d4SSatish Balay } 3589371c9d4SSatish Balay for (; jo < *hoi; jo++) { 3599371c9d4SSatish Balay *jj++ = *hoj++ + dc; 3609371c9d4SSatish Balay *aa++ = *hod++; 3619371c9d4SSatish Balay } 3622df22349SStefano Zampini *(++ii) = *(hdi++) + *(hoi++); 3639566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(jd + jo - nc, jold, aold)); 3642df22349SStefano Zampini } 3652df22349SStefano Zampini for (; cum < dr; cum++) *(++ii) = nnz; 3662df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 367a033916dSStefano Zampini Mat_SeqAIJ *a; 368a033916dSStefano Zampini 3699566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF, dr, dc + oc, iptr, jptr, data, &lA)); 3709566063dSJacob Faibussowitsch PetscCall(MatISSetLocalMat(*B, lA)); 371a033916dSStefano Zampini /* hack SeqAIJ */ 372a033916dSStefano Zampini a = (Mat_SeqAIJ *)(lA->data); 373a033916dSStefano Zampini a->free_a = PETSC_TRUE; 374a033916dSStefano Zampini a->free_ij = PETSC_TRUE; 3759566063dSJacob Faibussowitsch PetscCall(MatDestroy(&lA)); 3762df22349SStefano Zampini } 3779566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 3789566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 37948a46eb9SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, B)); 3803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3812df22349SStefano Zampini } 3822df22349SStefano Zampini 383d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B) 384d71ae5a4SJacob Faibussowitsch { 38584d4e069SStefano Zampini Mat M = NULL; 38663c07aadSStefano Zampini Mat_HYPRE *hB; 38763c07aadSStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 38863c07aadSStefano Zampini 38963c07aadSStefano Zampini PetscFunctionBegin; 39063c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 39163c07aadSStefano Zampini /* always destroy the old matrix and create a new memory; 39263c07aadSStefano Zampini hope this does not churn the memory too much. The problem 39363c07aadSStefano Zampini is I do not know if it is possible to put the matrix back to 39463c07aadSStefano Zampini its initial state so that we can directly copy the values 39563c07aadSStefano Zampini the second time through. */ 39663c07aadSStefano Zampini hB = (Mat_HYPRE *)((*B)->data); 397792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixDestroy, hB->ij); 39863c07aadSStefano Zampini } else { 3999566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &M)); 4009566063dSJacob Faibussowitsch PetscCall(MatSetType(M, MATHYPRE)); 4019566063dSJacob Faibussowitsch PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N)); 40284d4e069SStefano Zampini hB = (Mat_HYPRE *)(M->data); 40384d4e069SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) *B = M; 40463c07aadSStefano Zampini } 4059566063dSJacob Faibussowitsch PetscCall(MatSetOption(*B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 4069566063dSJacob Faibussowitsch PetscCall(MatSetOption(*B, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 4079566063dSJacob Faibussowitsch PetscCall(MatHYPRE_CreateFromMat(A, hB)); 4089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixCopy(A, hB->ij)); 40948a46eb9SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M)); 4104ec6421dSstefano_zampini (*B)->preallocated = PETSC_TRUE; 4119566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 4129566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 4133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 41463c07aadSStefano Zampini } 41563c07aadSStefano Zampini 416d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B) 417d71ae5a4SJacob Faibussowitsch { 41863c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 41963c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 42063c07aadSStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 42163c07aadSStefano Zampini MPI_Comm comm; 42263c07aadSStefano Zampini PetscScalar *da, *oa, *aptr; 42363c07aadSStefano Zampini PetscInt *dii, *djj, *oii, *ojj, *iptr; 42463c07aadSStefano Zampini PetscInt i, dnnz, onnz, m, n; 42558968eb6SStefano Zampini HYPRE_Int type; 42663c07aadSStefano Zampini PetscMPIInt size; 4272cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 42863c07aadSStefano Zampini 42963c07aadSStefano Zampini PetscFunctionBegin; 43063c07aadSStefano Zampini comm = PetscObjectComm((PetscObject)A); 431792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type); 43208401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 43363c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 43463c07aadSStefano Zampini PetscBool ismpiaij, isseqaij; 4359566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATMPIAIJ, &ismpiaij)); 4369566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATSEQAIJ, &isseqaij)); 43708401ef6SPierre Jolivet PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Only MATMPIAIJ or MATSEQAIJ are supported"); 43863c07aadSStefano Zampini } 4396ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 44008401ef6SPierre Jolivet PetscCheck(HYPRE_MEMORY_DEVICE != hypre_IJMatrixMemoryLocation(hA->ij), comm, PETSC_ERR_SUP, "Not yet implemented"); 4416ea7df73SStefano Zampini #endif 4429566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 44363c07aadSStefano Zampini 444792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr); 44563c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 44663c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 44763c07aadSStefano Zampini m = hypre_CSRMatrixNumRows(hdiag); 44863c07aadSStefano Zampini n = hypre_CSRMatrixNumCols(hdiag); 44963c07aadSStefano Zampini dnnz = hypre_CSRMatrixNumNonzeros(hdiag); 45063c07aadSStefano Zampini onnz = hypre_CSRMatrixNumNonzeros(hoffd); 451225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 4529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &dii)); 4539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz, &djj)); 4549566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz, &da)); 455225daaf8SStefano Zampini } else if (reuse == MAT_REUSE_MATRIX) { 45663c07aadSStefano Zampini PetscInt nr; 45763c07aadSStefano Zampini PetscBool done; 45863c07aadSStefano Zampini if (size > 1) { 45963c07aadSStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data); 46063c07aadSStefano Zampini 4619566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(b->A, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&dii, (const PetscInt **)&djj, &done)); 46208401ef6SPierre Jolivet PetscCheck(nr == m, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows in diag part! %" PetscInt_FMT " != %" PetscInt_FMT, nr, m); 46308401ef6SPierre Jolivet PetscCheck(dii[nr] >= dnnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in diag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, dii[nr], dnnz); 4649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(b->A, &da)); 46563c07aadSStefano Zampini } else { 4669566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(*B, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&dii, (const PetscInt **)&djj, &done)); 46708401ef6SPierre Jolivet PetscCheck(nr == m, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows! %" PetscInt_FMT " != %" PetscInt_FMT, nr, m); 46808401ef6SPierre Jolivet PetscCheck(dii[nr] >= dnnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, dii[nr], dnnz); 4699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*B, &da)); 47063c07aadSStefano Zampini } 471225daaf8SStefano Zampini } else { /* MAT_INPLACE_MATRIX */ 4722cf14000SStefano Zampini if (!sameint) { 4739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &dii)); 4749566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz, &djj)); 4752cf14000SStefano Zampini } else { 4767d968826Sstefano_zampini dii = (PetscInt *)hypre_CSRMatrixI(hdiag); 4777d968826Sstefano_zampini djj = (PetscInt *)hypre_CSRMatrixJ(hdiag); 47863c07aadSStefano Zampini } 47939accc25SStefano Zampini da = (PetscScalar *)hypre_CSRMatrixData(hdiag); 48063c07aadSStefano Zampini } 4812cf14000SStefano Zampini 4822cf14000SStefano Zampini if (!sameint) { 4839371c9d4SSatish Balay if (reuse != MAT_REUSE_MATRIX) { 4849371c9d4SSatish Balay for (i = 0; i < m + 1; i++) dii[i] = (PetscInt)(hypre_CSRMatrixI(hdiag)[i]); 4859371c9d4SSatish Balay } 4862cf14000SStefano Zampini for (i = 0; i < dnnz; i++) djj[i] = (PetscInt)(hypre_CSRMatrixJ(hdiag)[i]); 4872cf14000SStefano Zampini } else { 4889566063dSJacob Faibussowitsch if (reuse != MAT_REUSE_MATRIX) PetscCall(PetscArraycpy(dii, hypre_CSRMatrixI(hdiag), m + 1)); 4899566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(djj, hypre_CSRMatrixJ(hdiag), dnnz)); 4902cf14000SStefano Zampini } 4919566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(da, hypre_CSRMatrixData(hdiag), dnnz)); 49263c07aadSStefano Zampini iptr = djj; 49363c07aadSStefano Zampini aptr = da; 49463c07aadSStefano Zampini for (i = 0; i < m; i++) { 49563c07aadSStefano Zampini PetscInt nc = dii[i + 1] - dii[i]; 4969566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(nc, iptr, aptr)); 49763c07aadSStefano Zampini iptr += nc; 49863c07aadSStefano Zampini aptr += nc; 49963c07aadSStefano Zampini } 50063c07aadSStefano Zampini if (size > 1) { 5012cf14000SStefano Zampini HYPRE_BigInt *coffd; 5022cf14000SStefano Zampini HYPRE_Int *offdj; 50363c07aadSStefano Zampini 504225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 5059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &oii)); 5069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz, &ojj)); 5079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz, &oa)); 508225daaf8SStefano Zampini } else if (reuse == MAT_REUSE_MATRIX) { 50963c07aadSStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data); 51063c07aadSStefano Zampini PetscInt nr, hr = hypre_CSRMatrixNumRows(hoffd); 51163c07aadSStefano Zampini PetscBool done; 51263c07aadSStefano Zampini 5139566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(b->B, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&oii, (const PetscInt **)&ojj, &done)); 51408401ef6SPierre Jolivet PetscCheck(nr == hr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows in offdiag part! %" PetscInt_FMT " != %" PetscInt_FMT, nr, hr); 51508401ef6SPierre Jolivet PetscCheck(oii[nr] >= onnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in offdiag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, oii[nr], onnz); 5169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(b->B, &oa)); 517225daaf8SStefano Zampini } else { /* MAT_INPLACE_MATRIX */ 5182cf14000SStefano Zampini if (!sameint) { 5199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &oii)); 5209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz, &ojj)); 5212cf14000SStefano Zampini } else { 5227d968826Sstefano_zampini oii = (PetscInt *)hypre_CSRMatrixI(hoffd); 5237d968826Sstefano_zampini ojj = (PetscInt *)hypre_CSRMatrixJ(hoffd); 52463c07aadSStefano Zampini } 52539accc25SStefano Zampini oa = (PetscScalar *)hypre_CSRMatrixData(hoffd); 52663c07aadSStefano Zampini } 527a16187a7SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 5282cf14000SStefano Zampini if (!sameint) { 5292cf14000SStefano Zampini for (i = 0; i < m + 1; i++) oii[i] = (PetscInt)(hypre_CSRMatrixI(hoffd)[i]); 5302cf14000SStefano Zampini } else { 5319566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(oii, hypre_CSRMatrixI(hoffd), m + 1)); 5322cf14000SStefano Zampini } 533a16187a7SStefano Zampini } 5349566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(oa, hypre_CSRMatrixData(hoffd), onnz)); 535a16187a7SStefano Zampini 53663c07aadSStefano Zampini offdj = hypre_CSRMatrixJ(hoffd); 53763c07aadSStefano Zampini coffd = hypre_ParCSRMatrixColMapOffd(parcsr); 538a16187a7SStefano Zampini /* we only need the permutation to be computed properly, I don't know if HYPRE 539a16187a7SStefano Zampini messes up with the ordering. Just in case, allocate some memory and free it 540a16187a7SStefano Zampini later */ 541a16187a7SStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 542a16187a7SStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data); 543a16187a7SStefano Zampini PetscInt mnz; 544a16187a7SStefano Zampini 5459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetMaxRowNonzeros(b->B, &mnz)); 5469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mnz, &ojj)); 5479371c9d4SSatish Balay } else 5489371c9d4SSatish Balay for (i = 0; i < onnz; i++) ojj[i] = coffd[offdj[i]]; 54963c07aadSStefano Zampini iptr = ojj; 55063c07aadSStefano Zampini aptr = oa; 55163c07aadSStefano Zampini for (i = 0; i < m; i++) { 55263c07aadSStefano Zampini PetscInt nc = oii[i + 1] - oii[i]; 553a16187a7SStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 554a16187a7SStefano Zampini PetscInt j; 555a16187a7SStefano Zampini 556a16187a7SStefano Zampini iptr = ojj; 557a16187a7SStefano Zampini for (j = 0; j < nc; j++) iptr[j] = coffd[offdj[oii[i] + j]]; 558a16187a7SStefano Zampini } 5599566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(nc, iptr, aptr)); 56063c07aadSStefano Zampini iptr += nc; 56163c07aadSStefano Zampini aptr += nc; 56263c07aadSStefano Zampini } 5639566063dSJacob Faibussowitsch if (reuse == MAT_REUSE_MATRIX) PetscCall(PetscFree(ojj)); 564225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 56563c07aadSStefano Zampini Mat_MPIAIJ *b; 56663c07aadSStefano Zampini Mat_SeqAIJ *d, *o; 567225daaf8SStefano Zampini 5689566063dSJacob Faibussowitsch PetscCall(MatCreateMPIAIJWithSplitArrays(comm, m, n, PETSC_DECIDE, PETSC_DECIDE, dii, djj, da, oii, ojj, oa, B)); 56963c07aadSStefano Zampini /* hack MPIAIJ */ 57063c07aadSStefano Zampini b = (Mat_MPIAIJ *)((*B)->data); 57163c07aadSStefano Zampini d = (Mat_SeqAIJ *)b->A->data; 57263c07aadSStefano Zampini o = (Mat_SeqAIJ *)b->B->data; 57363c07aadSStefano Zampini d->free_a = PETSC_TRUE; 57463c07aadSStefano Zampini d->free_ij = PETSC_TRUE; 57563c07aadSStefano Zampini o->free_a = PETSC_TRUE; 57663c07aadSStefano Zampini o->free_ij = PETSC_TRUE; 577225daaf8SStefano Zampini } else if (reuse == MAT_INPLACE_MATRIX) { 578225daaf8SStefano Zampini Mat T; 5792cf14000SStefano Zampini 5809566063dSJacob Faibussowitsch PetscCall(MatCreateMPIAIJWithSplitArrays(comm, m, n, PETSC_DECIDE, PETSC_DECIDE, dii, djj, da, oii, ojj, oa, &T)); 5812cf14000SStefano Zampini if (sameint) { /* ownership of CSR pointers is transferred to PETSc */ 582225daaf8SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 583225daaf8SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 584225daaf8SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 585225daaf8SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 5862cf14000SStefano Zampini } else { /* Hack MPIAIJ -> free ij but not a */ 5872cf14000SStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ *)(T->data); 5882cf14000SStefano Zampini Mat_SeqAIJ *d = (Mat_SeqAIJ *)(b->A->data); 5892cf14000SStefano Zampini Mat_SeqAIJ *o = (Mat_SeqAIJ *)(b->B->data); 5902cf14000SStefano Zampini 5912cf14000SStefano Zampini d->free_ij = PETSC_TRUE; 5922cf14000SStefano Zampini o->free_ij = PETSC_TRUE; 5932cf14000SStefano Zampini } 5942cf14000SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 595225daaf8SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 5969566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &T)); 59763c07aadSStefano Zampini } 598225daaf8SStefano Zampini } else { 599225daaf8SStefano Zampini oii = NULL; 600225daaf8SStefano Zampini ojj = NULL; 601225daaf8SStefano Zampini oa = NULL; 602225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 60363c07aadSStefano Zampini Mat_SeqAIJ *b; 6042cf14000SStefano Zampini 6059566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(comm, m, n, dii, djj, da, B)); 60663c07aadSStefano Zampini /* hack SeqAIJ */ 60763c07aadSStefano Zampini b = (Mat_SeqAIJ *)((*B)->data); 60863c07aadSStefano Zampini b->free_a = PETSC_TRUE; 60963c07aadSStefano Zampini b->free_ij = PETSC_TRUE; 610225daaf8SStefano Zampini } else if (reuse == MAT_INPLACE_MATRIX) { 611225daaf8SStefano Zampini Mat T; 6122cf14000SStefano Zampini 6139566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(comm, m, n, dii, djj, da, &T)); 6142cf14000SStefano Zampini if (sameint) { /* ownership of CSR pointers is transferred to PETSc */ 615225daaf8SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 616225daaf8SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 6172cf14000SStefano Zampini } else { /* free ij but not a */ 6182cf14000SStefano Zampini Mat_SeqAIJ *b = (Mat_SeqAIJ *)(T->data); 6192cf14000SStefano Zampini 6202cf14000SStefano Zampini b->free_ij = PETSC_TRUE; 6212cf14000SStefano Zampini } 622225daaf8SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 6239566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &T)); 62463c07aadSStefano Zampini } 625225daaf8SStefano Zampini } 626225daaf8SStefano Zampini 6272cf14000SStefano Zampini /* we have to use hypre_Tfree to free the HYPRE arrays 628da81f932SPierre Jolivet that PETSc now owns */ 62963c07aadSStefano Zampini if (reuse == MAT_INPLACE_MATRIX) { 6302cf14000SStefano Zampini PetscInt nh; 6312cf14000SStefano Zampini void *ptrs[6] = {da, oa, dii, djj, oii, ojj}; 6329371c9d4SSatish Balay const char *names[6] = {"_hypre_csr_da", "_hypre_csr_oa", "_hypre_csr_dii", "_hypre_csr_djj", "_hypre_csr_oii", "_hypre_csr_ojj"}; 6332cf14000SStefano Zampini nh = sameint ? 6 : 2; 6342cf14000SStefano Zampini for (i = 0; i < nh; i++) { 635225daaf8SStefano Zampini PetscContainer c; 636225daaf8SStefano Zampini 6379566063dSJacob Faibussowitsch PetscCall(PetscContainerCreate(comm, &c)); 6389566063dSJacob Faibussowitsch PetscCall(PetscContainerSetPointer(c, ptrs[i])); 6399566063dSJacob Faibussowitsch PetscCall(PetscContainerSetUserDestroy(c, hypre_array_destroy)); 6409566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)(*B), names[i], (PetscObject)c)); 6419566063dSJacob Faibussowitsch PetscCall(PetscContainerDestroy(&c)); 642225daaf8SStefano Zampini } 64363c07aadSStefano Zampini } 6443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 64563c07aadSStefano Zampini } 64663c07aadSStefano Zampini 647d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 648d71ae5a4SJacob Faibussowitsch { 649613e5ff0Sstefano_zampini hypre_ParCSRMatrix *tA; 650c1a070e6SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 651c1a070e6SStefano Zampini Mat_SeqAIJ *diag, *offd; 6522cf14000SStefano Zampini PetscInt *garray, i, noffd, dnnz, onnz, *row_starts, *col_starts; 653c1a070e6SStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 654613e5ff0Sstefano_zampini PetscBool ismpiaij, isseqaij; 6552cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 6566ea7df73SStefano Zampini HYPRE_Int *hdi = NULL, *hdj = NULL, *hoi = NULL, *hoj = NULL; 6575c97c10fSStefano Zampini PetscInt *pdi = NULL, *pdj = NULL, *poi = NULL, *poj = NULL; 6586ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 6596ea7df73SStefano Zampini PetscBool iscuda = PETSC_FALSE; 6606ea7df73SStefano Zampini #endif 661c1a070e6SStefano Zampini 662c1a070e6SStefano Zampini PetscFunctionBegin; 6639566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij)); 6649566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &isseqaij)); 66508401ef6SPierre Jolivet PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Unsupported type %s", ((PetscObject)A)->type_name); 666c1a070e6SStefano Zampini if (ismpiaij) { 667c1a070e6SStefano Zampini Mat_MPIAIJ *a = (Mat_MPIAIJ *)(A->data); 668c1a070e6SStefano Zampini 669c1a070e6SStefano Zampini diag = (Mat_SeqAIJ *)a->A->data; 670c1a070e6SStefano Zampini offd = (Mat_SeqAIJ *)a->B->data; 6716ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) && defined(HYPRE_USING_CUDA) 6729566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATMPIAIJCUSPARSE, &iscuda)); 6736ea7df73SStefano Zampini if (iscuda && !A->boundtocpu) { 6746ea7df73SStefano Zampini sameint = PETSC_TRUE; 6759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj)); 6769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj)); 6776ea7df73SStefano Zampini } else { 6786ea7df73SStefano Zampini #else 6796ea7df73SStefano Zampini { 6806ea7df73SStefano Zampini #endif 6816ea7df73SStefano Zampini pdi = diag->i; 6826ea7df73SStefano Zampini pdj = diag->j; 6836ea7df73SStefano Zampini poi = offd->i; 6846ea7df73SStefano Zampini poj = offd->j; 6856ea7df73SStefano Zampini if (sameint) { 6866ea7df73SStefano Zampini hdi = (HYPRE_Int *)pdi; 6876ea7df73SStefano Zampini hdj = (HYPRE_Int *)pdj; 6886ea7df73SStefano Zampini hoi = (HYPRE_Int *)poi; 6896ea7df73SStefano Zampini hoj = (HYPRE_Int *)poj; 6906ea7df73SStefano Zampini } 6916ea7df73SStefano Zampini } 692c1a070e6SStefano Zampini garray = a->garray; 693c1a070e6SStefano Zampini noffd = a->B->cmap->N; 694c1a070e6SStefano Zampini dnnz = diag->nz; 695c1a070e6SStefano Zampini onnz = offd->nz; 696c1a070e6SStefano Zampini } else { 697c1a070e6SStefano Zampini diag = (Mat_SeqAIJ *)A->data; 698c1a070e6SStefano Zampini offd = NULL; 6996ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) 7009566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATSEQAIJCUSPARSE, &iscuda)); 7016ea7df73SStefano Zampini if (iscuda && !A->boundtocpu) { 7026ea7df73SStefano Zampini sameint = PETSC_TRUE; 7039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj)); 7046ea7df73SStefano Zampini } else { 7056ea7df73SStefano Zampini #else 7066ea7df73SStefano Zampini { 7076ea7df73SStefano Zampini #endif 7086ea7df73SStefano Zampini pdi = diag->i; 7096ea7df73SStefano Zampini pdj = diag->j; 7106ea7df73SStefano Zampini if (sameint) { 7116ea7df73SStefano Zampini hdi = (HYPRE_Int *)pdi; 7126ea7df73SStefano Zampini hdj = (HYPRE_Int *)pdj; 7136ea7df73SStefano Zampini } 7146ea7df73SStefano Zampini } 715c1a070e6SStefano Zampini garray = NULL; 716c1a070e6SStefano Zampini noffd = 0; 717c1a070e6SStefano Zampini dnnz = diag->nz; 718c1a070e6SStefano Zampini onnz = 0; 719c1a070e6SStefano Zampini } 720225daaf8SStefano Zampini 721c1a070e6SStefano Zampini /* create a temporary ParCSR */ 722c1a070e6SStefano Zampini if (HYPRE_AssumedPartitionCheck()) { 723c1a070e6SStefano Zampini PetscMPIInt myid; 724c1a070e6SStefano Zampini 7259566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &myid)); 726c1a070e6SStefano Zampini row_starts = A->rmap->range + myid; 727c1a070e6SStefano Zampini col_starts = A->cmap->range + myid; 728c1a070e6SStefano Zampini } else { 729c1a070e6SStefano Zampini row_starts = A->rmap->range; 730c1a070e6SStefano Zampini col_starts = A->cmap->range; 731c1a070e6SStefano Zampini } 7322cf14000SStefano Zampini tA = hypre_ParCSRMatrixCreate(comm, A->rmap->N, A->cmap->N, (HYPRE_BigInt *)row_starts, (HYPRE_BigInt *)col_starts, noffd, dnnz, onnz); 733a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 734c1a070e6SStefano Zampini hypre_ParCSRMatrixSetRowStartsOwner(tA, 0); 735c1a070e6SStefano Zampini hypre_ParCSRMatrixSetColStartsOwner(tA, 0); 736a1d2239cSSatish Balay #endif 737c1a070e6SStefano Zampini 738225daaf8SStefano Zampini /* set diagonal part */ 739c1a070e6SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(tA); 7406ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 7419566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n + 1, &hdi, dnnz, &hdj)); 7426ea7df73SStefano Zampini for (i = 0; i < A->rmap->n + 1; i++) hdi[i] = (HYPRE_Int)(pdi[i]); 7436ea7df73SStefano Zampini for (i = 0; i < dnnz; i++) hdj[i] = (HYPRE_Int)(pdj[i]); 7442cf14000SStefano Zampini } 7456ea7df73SStefano Zampini hypre_CSRMatrixI(hdiag) = hdi; 7466ea7df73SStefano Zampini hypre_CSRMatrixJ(hdiag) = hdj; 74739accc25SStefano Zampini hypre_CSRMatrixData(hdiag) = (HYPRE_Complex *)diag->a; 748c1a070e6SStefano Zampini hypre_CSRMatrixNumNonzeros(hdiag) = diag->nz; 749c1a070e6SStefano Zampini hypre_CSRMatrixSetRownnz(hdiag); 750c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hdiag, 0); 751c1a070e6SStefano Zampini 752225daaf8SStefano Zampini /* set offdiagonal part */ 753c1a070e6SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(tA); 754c1a070e6SStefano Zampini if (offd) { 7556ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 7569566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n + 1, &hoi, onnz, &hoj)); 7576ea7df73SStefano Zampini for (i = 0; i < A->rmap->n + 1; i++) hoi[i] = (HYPRE_Int)(poi[i]); 7586ea7df73SStefano Zampini for (i = 0; i < onnz; i++) hoj[i] = (HYPRE_Int)(poj[i]); 7592cf14000SStefano Zampini } 7606ea7df73SStefano Zampini hypre_CSRMatrixI(hoffd) = hoi; 7616ea7df73SStefano Zampini hypre_CSRMatrixJ(hoffd) = hoj; 76239accc25SStefano Zampini hypre_CSRMatrixData(hoffd) = (HYPRE_Complex *)offd->a; 763c1a070e6SStefano Zampini hypre_CSRMatrixNumNonzeros(hoffd) = offd->nz; 764c1a070e6SStefano Zampini hypre_CSRMatrixSetRownnz(hoffd); 765c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hoffd, 0); 7666ea7df73SStefano Zampini } 7676ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 768792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize_v2, tA, iscuda ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST); 7696ea7df73SStefano Zampini #else 7706ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 771792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize, tA); 7726ea7df73SStefano Zampini #else 773792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize_v2, tA, HYPRE_MEMORY_HOST); 7746ea7df73SStefano Zampini #endif 7756ea7df73SStefano Zampini #endif 7766ea7df73SStefano Zampini hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA), HYPRE_MEMORY_HOST); 777c1a070e6SStefano Zampini hypre_ParCSRMatrixSetNumNonzeros(tA); 7782cf14000SStefano Zampini hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt *)garray; 779792fecdfSBarry Smith if (!hypre_ParCSRMatrixCommPkg(tA)) PetscCallExternal(hypre_MatvecCommPkgCreate, tA); 780613e5ff0Sstefano_zampini *hA = tA; 7813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 782613e5ff0Sstefano_zampini } 783c1a070e6SStefano Zampini 784d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 785d71ae5a4SJacob Faibussowitsch { 786613e5ff0Sstefano_zampini hypre_CSRMatrix *hdiag, *hoffd; 7876ea7df73SStefano Zampini PetscBool ismpiaij, sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 7886ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 7896ea7df73SStefano Zampini PetscBool iscuda = PETSC_FALSE; 7906ea7df73SStefano Zampini #endif 791c1a070e6SStefano Zampini 792613e5ff0Sstefano_zampini PetscFunctionBegin; 7939566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij)); 7946ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 7959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, "")); 7966ea7df73SStefano Zampini if (iscuda) sameint = PETSC_TRUE; 7976ea7df73SStefano Zampini #endif 798613e5ff0Sstefano_zampini hdiag = hypre_ParCSRMatrixDiag(*hA); 799613e5ff0Sstefano_zampini hoffd = hypre_ParCSRMatrixOffd(*hA); 8006ea7df73SStefano Zampini /* free temporary memory allocated by PETSc 8016ea7df73SStefano Zampini set pointers to NULL before destroying tA */ 8022cf14000SStefano Zampini if (!sameint) { 8032cf14000SStefano Zampini HYPRE_Int *hi, *hj; 8042cf14000SStefano Zampini 8052cf14000SStefano Zampini hi = hypre_CSRMatrixI(hdiag); 8062cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hdiag); 8079566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi, hj)); 8086ea7df73SStefano Zampini if (ismpiaij) { 8092cf14000SStefano Zampini hi = hypre_CSRMatrixI(hoffd); 8102cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hoffd); 8119566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi, hj)); 8122cf14000SStefano Zampini } 8132cf14000SStefano Zampini } 814c1a070e6SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 815c1a070e6SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 816c1a070e6SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 8176ea7df73SStefano Zampini if (ismpiaij) { 818c1a070e6SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 819c1a070e6SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 820c1a070e6SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 8216ea7df73SStefano Zampini } 822613e5ff0Sstefano_zampini hypre_ParCSRMatrixColMapOffd(*hA) = NULL; 823613e5ff0Sstefano_zampini hypre_ParCSRMatrixDestroy(*hA); 824613e5ff0Sstefano_zampini *hA = NULL; 8253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 826613e5ff0Sstefano_zampini } 827613e5ff0Sstefano_zampini 828613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG: 8293dad0653Sstefano_zampini the resulting ParCSR will not own the column and row starts 8306ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 831d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP) 832d71ae5a4SJacob Faibussowitsch { 833a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 834613e5ff0Sstefano_zampini HYPRE_Int P_owns_col_starts, R_owns_row_starts; 835a1d2239cSSatish Balay #endif 836613e5ff0Sstefano_zampini 837613e5ff0Sstefano_zampini PetscFunctionBegin; 838a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 839613e5ff0Sstefano_zampini P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP); 840613e5ff0Sstefano_zampini R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR); 841a1d2239cSSatish Balay #endif 8426ea7df73SStefano Zampini /* can be replaced by version test later */ 8436ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 844792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatrixRAP"); 8456ea7df73SStefano Zampini *hRAP = hypre_ParCSRMatrixRAP(hR, hA, hP); 8466ea7df73SStefano Zampini PetscStackPop; 8476ea7df73SStefano Zampini #else 848792fecdfSBarry Smith PetscCallExternal(hypre_BoomerAMGBuildCoarseOperator, hR, hA, hP, hRAP); 849792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixSetNumNonzeros, *hRAP); 8506ea7df73SStefano Zampini #endif 851613e5ff0Sstefano_zampini /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */ 852a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 853613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetRowStartsOwner(*hRAP, 0); 854613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetColStartsOwner(*hRAP, 0); 855613e5ff0Sstefano_zampini if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP, 1); 856613e5ff0Sstefano_zampini if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR, 1); 857a1d2239cSSatish Balay #endif 8583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 859613e5ff0Sstefano_zampini } 860613e5ff0Sstefano_zampini 861d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat P, Mat C) 862d71ae5a4SJacob Faibussowitsch { 8636f231fbdSstefano_zampini Mat B; 8646abb4441SStefano Zampini hypre_ParCSRMatrix *hA, *hP, *hPtAP = NULL; 8654222ddf1SHong Zhang Mat_Product *product = C->product; 866613e5ff0Sstefano_zampini 867613e5ff0Sstefano_zampini PetscFunctionBegin; 8689566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 8699566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(P, &hP)); 8709566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hP, hA, hP, &hPtAP)); 8719566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hPtAP, MATAIJ, PETSC_OWN_POINTER, &B)); 8724222ddf1SHong Zhang 8739566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 8744222ddf1SHong Zhang C->product = product; 8754222ddf1SHong Zhang 8769566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 8779566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(P, &hP)); 8783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8796f231fbdSstefano_zampini } 8806f231fbdSstefano_zampini 881d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat P, PetscReal fill, Mat C) 882d71ae5a4SJacob Faibussowitsch { 8836f231fbdSstefano_zampini PetscFunctionBegin; 8849566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 8854222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_AIJ_wHYPRE; 8864222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 8873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 888613e5ff0Sstefano_zampini } 889613e5ff0Sstefano_zampini 890d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A, Mat P, Mat C) 891d71ae5a4SJacob Faibussowitsch { 8924cc28894Sstefano_zampini Mat B; 8934cc28894Sstefano_zampini Mat_HYPRE *hP; 8946abb4441SStefano Zampini hypre_ParCSRMatrix *hA = NULL, *Pparcsr, *ptapparcsr = NULL; 895613e5ff0Sstefano_zampini HYPRE_Int type; 896613e5ff0Sstefano_zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 8974cc28894Sstefano_zampini PetscBool ishypre; 898613e5ff0Sstefano_zampini 899613e5ff0Sstefano_zampini PetscFunctionBegin; 9009566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre)); 90128b400f6SJacob Faibussowitsch PetscCheck(ishypre, comm, PETSC_ERR_USER, "P should be of type %s", MATHYPRE); 9024cc28894Sstefano_zampini hP = (Mat_HYPRE *)P->data; 903792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hP->ij, &type); 90408401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 905792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hP->ij, (void **)&Pparcsr); 906613e5ff0Sstefano_zampini 9079566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 9089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, hA, Pparcsr, &ptapparcsr)); 9099566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 910225daaf8SStefano Zampini 9114cc28894Sstefano_zampini /* create temporary matrix and merge to C */ 9129566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr, ((PetscObject)C)->type_name, PETSC_OWN_POINTER, &B)); 9139566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 9143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9154cc28894Sstefano_zampini } 9164cc28894Sstefano_zampini 917d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A, Mat P, Mat C) 918d71ae5a4SJacob Faibussowitsch { 9194cc28894Sstefano_zampini Mat B; 9206abb4441SStefano Zampini hypre_ParCSRMatrix *Aparcsr, *Pparcsr, *ptapparcsr = NULL; 9214cc28894Sstefano_zampini Mat_HYPRE *hA, *hP; 9224cc28894Sstefano_zampini PetscBool ishypre; 9234cc28894Sstefano_zampini HYPRE_Int type; 9244cc28894Sstefano_zampini 9254cc28894Sstefano_zampini PetscFunctionBegin; 9269566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre)); 92728b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)P), PETSC_ERR_USER, "P should be of type %s", MATHYPRE); 9289566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre)); 92928b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE); 9304cc28894Sstefano_zampini hA = (Mat_HYPRE *)A->data; 9314cc28894Sstefano_zampini hP = (Mat_HYPRE *)P->data; 932792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type); 93308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 934792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hP->ij, &type); 93508401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)P), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 936792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&Aparcsr); 937792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hP->ij, (void **)&Pparcsr); 9389566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, Aparcsr, Pparcsr, &ptapparcsr)); 9399566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr, MATHYPRE, PETSC_OWN_POINTER, &B)); 9409566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 9413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9424cc28894Sstefano_zampini } 9434cc28894Sstefano_zampini 944d501dc42Sstefano_zampini /* calls hypre_ParMatmul 945d501dc42Sstefano_zampini hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA 9463dad0653Sstefano_zampini hypre_ParMatrixCreate does not duplicate the communicator 9476ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 948d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB) 949d71ae5a4SJacob Faibussowitsch { 950d501dc42Sstefano_zampini PetscFunctionBegin; 9516ea7df73SStefano Zampini /* can be replaced by version test later */ 9526ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 953792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatMat"); 9546ea7df73SStefano Zampini *hAB = hypre_ParCSRMatMat(hA, hB); 9556ea7df73SStefano Zampini #else 956792fecdfSBarry Smith PetscStackPushExternal("hypre_ParMatmul"); 957d501dc42Sstefano_zampini *hAB = hypre_ParMatmul(hA, hB); 9586ea7df73SStefano Zampini #endif 959d501dc42Sstefano_zampini PetscStackPop; 9603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 961d501dc42Sstefano_zampini } 962d501dc42Sstefano_zampini 963d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C) 964d71ae5a4SJacob Faibussowitsch { 9655e5acdf2Sstefano_zampini Mat D; 966d501dc42Sstefano_zampini hypre_ParCSRMatrix *hA, *hB, *hAB = NULL; 9674222ddf1SHong Zhang Mat_Product *product = C->product; 9685e5acdf2Sstefano_zampini 9695e5acdf2Sstefano_zampini PetscFunctionBegin; 9709566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 9719566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B, &hB)); 9729566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(hA, hB, &hAB)); 9739566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hAB, MATAIJ, PETSC_OWN_POINTER, &D)); 9744222ddf1SHong Zhang 9759566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &D)); 9764222ddf1SHong Zhang C->product = product; 9774222ddf1SHong Zhang 9789566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 9799566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B, &hB)); 9803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9815e5acdf2Sstefano_zampini } 9825e5acdf2Sstefano_zampini 983d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat B, PetscReal fill, Mat C) 984d71ae5a4SJacob Faibussowitsch { 9855e5acdf2Sstefano_zampini PetscFunctionBegin; 9869566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 9874222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE; 9884222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 9893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9905e5acdf2Sstefano_zampini } 9915e5acdf2Sstefano_zampini 992d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A, Mat B, Mat C) 993d71ae5a4SJacob Faibussowitsch { 994d501dc42Sstefano_zampini Mat D; 995d501dc42Sstefano_zampini hypre_ParCSRMatrix *Aparcsr, *Bparcsr, *ABparcsr = NULL; 996d501dc42Sstefano_zampini Mat_HYPRE *hA, *hB; 997d501dc42Sstefano_zampini PetscBool ishypre; 998d501dc42Sstefano_zampini HYPRE_Int type; 9994222ddf1SHong Zhang Mat_Product *product; 1000d501dc42Sstefano_zampini 1001d501dc42Sstefano_zampini PetscFunctionBegin; 10029566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHYPRE, &ishypre)); 100328b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)B), PETSC_ERR_USER, "B should be of type %s", MATHYPRE); 10049566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre)); 100528b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE); 1006d501dc42Sstefano_zampini hA = (Mat_HYPRE *)A->data; 1007d501dc42Sstefano_zampini hB = (Mat_HYPRE *)B->data; 1008792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type); 100908401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1010792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hB->ij, &type); 101108401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1012792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&Aparcsr); 1013792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hB->ij, (void **)&Bparcsr); 10149566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(Aparcsr, Bparcsr, &ABparcsr)); 10159566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ABparcsr, MATHYPRE, PETSC_OWN_POINTER, &D)); 10164222ddf1SHong Zhang 1017d501dc42Sstefano_zampini /* need to use HeaderReplace because HeaderMerge messes up with the communicator */ 10184222ddf1SHong Zhang product = C->product; /* save it from MatHeaderReplace() */ 10194222ddf1SHong Zhang C->product = NULL; 10209566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(C, &D)); 10214222ddf1SHong Zhang C->product = product; 1022d501dc42Sstefano_zampini C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 10234222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 10243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1025d501dc42Sstefano_zampini } 1026d501dc42Sstefano_zampini 1027d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, Mat D) 1028d71ae5a4SJacob Faibussowitsch { 102920e1dc0dSstefano_zampini Mat E; 10306abb4441SStefano Zampini hypre_ParCSRMatrix *hA, *hB, *hC, *hABC = NULL; 103120e1dc0dSstefano_zampini 103220e1dc0dSstefano_zampini PetscFunctionBegin; 10339566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 10349566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B, &hB)); 10359566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(C, &hC)); 10369566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hA, hB, hC, &hABC)); 10379566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hABC, MATAIJ, PETSC_OWN_POINTER, &E)); 10389566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(D, &E)); 10399566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 10409566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B, &hB)); 10419566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(C, &hC)); 10423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 104320e1dc0dSstefano_zampini } 104420e1dc0dSstefano_zampini 1045d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, PetscReal fill, Mat D) 1046d71ae5a4SJacob Faibussowitsch { 104720e1dc0dSstefano_zampini PetscFunctionBegin; 10489566063dSJacob Faibussowitsch PetscCall(MatSetType(D, MATAIJ)); 10493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 105020e1dc0dSstefano_zampini } 105120e1dc0dSstefano_zampini 1052d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C) 1053d71ae5a4SJacob Faibussowitsch { 10544222ddf1SHong Zhang PetscFunctionBegin; 10554222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 10563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10574222ddf1SHong Zhang } 10584222ddf1SHong Zhang 1059d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C) 1060d71ae5a4SJacob Faibussowitsch { 10614222ddf1SHong Zhang Mat_Product *product = C->product; 10624222ddf1SHong Zhang PetscBool Ahypre; 10634222ddf1SHong Zhang 10644222ddf1SHong Zhang PetscFunctionBegin; 10659566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)product->A, MATHYPRE, &Ahypre)); 10664222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 10679566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 10684222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE; 10694222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 10703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10716718818eSStefano Zampini } 10723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10734222ddf1SHong Zhang } 10744222ddf1SHong Zhang 1075d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C) 1076d71ae5a4SJacob Faibussowitsch { 10774222ddf1SHong Zhang PetscFunctionBegin; 10784222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 10793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10804222ddf1SHong Zhang } 10814222ddf1SHong Zhang 1082d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C) 1083d71ae5a4SJacob Faibussowitsch { 10844222ddf1SHong Zhang Mat_Product *product = C->product; 10854222ddf1SHong Zhang PetscBool flg; 10864222ddf1SHong Zhang PetscInt type = 0; 10874222ddf1SHong Zhang const char *outTypes[4] = {"aij", "seqaij", "mpiaij", "hypre"}; 10884222ddf1SHong Zhang PetscInt ntype = 4; 10894222ddf1SHong Zhang Mat A = product->A; 10904222ddf1SHong Zhang PetscBool Ahypre; 10914222ddf1SHong Zhang 10924222ddf1SHong Zhang PetscFunctionBegin; 10939566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &Ahypre)); 10944222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 10959566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 10964222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 10974222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_HYPRE_HYPRE; 10983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10994222ddf1SHong Zhang } 11004222ddf1SHong Zhang 11014222ddf1SHong Zhang /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */ 11024222ddf1SHong Zhang /* Get runtime option */ 11034222ddf1SHong Zhang if (product->api_user) { 1104d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatPtAP_HYPRE", "Mat"); 11059566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-matptap_hypre_outtype", "MatPtAP outtype", "MatPtAP outtype", outTypes, ntype, outTypes[type], &type, &flg)); 1106d0609cedSBarry Smith PetscOptionsEnd(); 11074222ddf1SHong Zhang } else { 1108d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatProduct_PtAP_HYPRE", "Mat"); 11099566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-mat_product_algorithm_hypre_outtype", "MatProduct_PtAP outtype", "MatProduct_PtAP", outTypes, ntype, outTypes[type], &type, &flg)); 1110d0609cedSBarry Smith PetscOptionsEnd(); 11114222ddf1SHong Zhang } 11124222ddf1SHong Zhang 11134222ddf1SHong Zhang if (type == 0 || type == 1 || type == 2) { 11149566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 11154222ddf1SHong Zhang } else if (type == 3) { 11169566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 11174222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C), PETSC_ERR_SUP, "MatPtAP outtype is not supported"); 11184222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 11194222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_HYPRE; 11203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11214222ddf1SHong Zhang } 11224222ddf1SHong Zhang 1123d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C) 1124d71ae5a4SJacob Faibussowitsch { 11254222ddf1SHong Zhang Mat_Product *product = C->product; 11264222ddf1SHong Zhang 11274222ddf1SHong Zhang PetscFunctionBegin; 11284222ddf1SHong Zhang switch (product->type) { 1129d71ae5a4SJacob Faibussowitsch case MATPRODUCT_AB: 1130d71ae5a4SJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_AB(C)); 1131d71ae5a4SJacob Faibussowitsch break; 1132d71ae5a4SJacob Faibussowitsch case MATPRODUCT_PtAP: 1133d71ae5a4SJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_PtAP(C)); 1134d71ae5a4SJacob Faibussowitsch break; 1135d71ae5a4SJacob Faibussowitsch default: 1136d71ae5a4SJacob Faibussowitsch break; 11374222ddf1SHong Zhang } 11383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11394222ddf1SHong Zhang } 11404222ddf1SHong Zhang 1141d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y) 1142d71ae5a4SJacob Faibussowitsch { 114363c07aadSStefano Zampini PetscFunctionBegin; 11449566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_TRUE)); 11453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 114663c07aadSStefano Zampini } 114763c07aadSStefano Zampini 1148d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y) 1149d71ae5a4SJacob Faibussowitsch { 115063c07aadSStefano Zampini PetscFunctionBegin; 11519566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_FALSE)); 11523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115363c07aadSStefano Zampini } 115463c07aadSStefano Zampini 1155d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1156d71ae5a4SJacob Faibussowitsch { 1157414bd5c3SStefano Zampini PetscFunctionBegin; 115848a46eb9SPierre Jolivet if (y != z) PetscCall(VecCopy(y, z)); 11599566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_FALSE)); 11603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1161414bd5c3SStefano Zampini } 1162414bd5c3SStefano Zampini 1163d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1164d71ae5a4SJacob Faibussowitsch { 1165414bd5c3SStefano Zampini PetscFunctionBegin; 116648a46eb9SPierre Jolivet if (y != z) PetscCall(VecCopy(y, z)); 11679566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_TRUE)); 11683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1169414bd5c3SStefano Zampini } 1170414bd5c3SStefano Zampini 1171414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */ 1172d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans) 1173d71ae5a4SJacob Faibussowitsch { 117463c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 117563c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 117663c07aadSStefano Zampini hypre_ParVector *hx, *hy; 117763c07aadSStefano Zampini 117863c07aadSStefano Zampini PetscFunctionBegin; 117963c07aadSStefano Zampini if (trans) { 11809566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->b, x)); 11819566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->x, y)); 11829566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->x, y)); 1183792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject, hA->b->ij, (void **)&hx); 1184792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject, hA->x->ij, (void **)&hy); 118563c07aadSStefano Zampini } else { 11869566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->x, x)); 11879566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->b, y)); 11889566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->b, y)); 1189792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject, hA->x->ij, (void **)&hx); 1190792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject, hA->b->ij, (void **)&hy); 119163c07aadSStefano Zampini } 1192792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr); 11936ea7df73SStefano Zampini if (trans) { 1194792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMatvecT, a, parcsr, hx, b, hy); 11956ea7df73SStefano Zampini } else { 1196792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMatvec, a, parcsr, hx, b, hy); 11976ea7df73SStefano Zampini } 11989566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->x)); 11999566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->b)); 12003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120163c07aadSStefano Zampini } 120263c07aadSStefano Zampini 1203d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDestroy_HYPRE(Mat A) 1204d71ae5a4SJacob Faibussowitsch { 120563c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 120663c07aadSStefano Zampini 120763c07aadSStefano Zampini PetscFunctionBegin; 12089566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->x)); 12099566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->b)); 1210978814f1SStefano Zampini if (hA->ij) { 1211978814f1SStefano Zampini if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL; 1212792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixDestroy, hA->ij); 1213978814f1SStefano Zampini } 12149566063dSJacob Faibussowitsch if (hA->comm) PetscCall(PetscCommRestoreComm(PetscObjectComm((PetscObject)A), &hA->comm)); 1215c69f721fSFande Kong 12169566063dSJacob Faibussowitsch PetscCall(MatStashDestroy_Private(&A->stash)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array)); 1218c69f721fSFande Kong 12195fbaff96SJunchao Zhang if (hA->cooMat) { 12205fbaff96SJunchao Zhang PetscCall(MatDestroy(&hA->cooMat)); 1221e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->diagJ, hA->memType)); 1222e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->offdJ, hA->memType)); 1223e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->diag, hA->memType)); 12245fbaff96SJunchao Zhang } 12255fbaff96SJunchao Zhang 12269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_aij_C", NULL)); 12279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_is_C", NULL)); 12289566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_hypre_C", NULL)); 12299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaij_hypre_C", NULL)); 12309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPRESetPreallocation_C", NULL)); 12319566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPREGetParCSR_C", NULL)); 12325fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12335fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12349566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 12353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 123663c07aadSStefano Zampini } 123763c07aadSStefano Zampini 1238d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetUp_HYPRE(Mat A) 1239d71ae5a4SJacob Faibussowitsch { 12404ec6421dSstefano_zampini PetscFunctionBegin; 12419566063dSJacob Faibussowitsch PetscCall(MatHYPRESetPreallocation(A, PETSC_DEFAULT, NULL, PETSC_DEFAULT, NULL)); 12423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12434ec6421dSstefano_zampini } 12444ec6421dSstefano_zampini 12456ea7df73SStefano Zampini //TODO FIX hypre_CSRMatrixMatvecOutOfPlace 12466ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 1247d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind) 1248d71ae5a4SJacob Faibussowitsch { 12496ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 12506ea7df73SStefano Zampini HYPRE_MemoryLocation hmem = bind ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE; 12516ea7df73SStefano Zampini 12526ea7df73SStefano Zampini PetscFunctionBegin; 12536ea7df73SStefano Zampini A->boundtocpu = bind; 12545fbaff96SJunchao Zhang if (hA->ij && hypre_IJMatrixAssembleFlag(hA->ij) && hmem != hypre_IJMatrixMemoryLocation(hA->ij)) { 12556ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 1256792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr); 1257792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMigrate, parcsr, hmem); 12586ea7df73SStefano Zampini } 12599566063dSJacob Faibussowitsch if (hA->x) PetscCall(VecHYPRE_IJBindToCPU(hA->x, bind)); 12609566063dSJacob Faibussowitsch if (hA->b) PetscCall(VecHYPRE_IJBindToCPU(hA->b, bind)); 12613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12626ea7df73SStefano Zampini } 12636ea7df73SStefano Zampini #endif 12646ea7df73SStefano Zampini 1265d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode) 1266d71ae5a4SJacob Faibussowitsch { 126763c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1268c69f721fSFande Kong PetscMPIInt n; 1269c69f721fSFande Kong PetscInt i, j, rstart, ncols, flg; 1270c69f721fSFande Kong PetscInt *row, *col; 1271c69f721fSFande Kong PetscScalar *val; 127263c07aadSStefano Zampini 127363c07aadSStefano Zampini PetscFunctionBegin; 127408401ef6SPierre Jolivet PetscCheck(mode != MAT_FLUSH_ASSEMBLY, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE"); 1275c69f721fSFande Kong 1276c69f721fSFande Kong if (!A->nooffprocentries) { 1277c69f721fSFande Kong while (1) { 12789566063dSJacob Faibussowitsch PetscCall(MatStashScatterGetMesg_Private(&A->stash, &n, &row, &col, &val, &flg)); 1279c69f721fSFande Kong if (!flg) break; 1280c69f721fSFande Kong 1281c69f721fSFande Kong for (i = 0; i < n;) { 1282c69f721fSFande Kong /* Now identify the consecutive vals belonging to the same row */ 1283c69f721fSFande Kong for (j = i, rstart = row[j]; j < n; j++) { 1284c69f721fSFande Kong if (row[j] != rstart) break; 1285c69f721fSFande Kong } 1286c69f721fSFande Kong if (j < n) ncols = j - i; 1287c69f721fSFande Kong else ncols = n - i; 1288c69f721fSFande Kong /* Now assemble all these values with a single function call */ 12899566063dSJacob Faibussowitsch PetscCall(MatSetValues_HYPRE(A, 1, row + i, ncols, col + i, val + i, A->insertmode)); 1290c69f721fSFande Kong 1291c69f721fSFande Kong i = j; 1292c69f721fSFande Kong } 1293c69f721fSFande Kong } 12949566063dSJacob Faibussowitsch PetscCall(MatStashScatterEnd_Private(&A->stash)); 1295c69f721fSFande Kong } 1296c69f721fSFande Kong 1297792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixAssemble, hA->ij); 1298336664bdSPierre Jolivet /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */ 1299336664bdSPierre Jolivet /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */ 1300336664bdSPierre Jolivet if (!hA->sorted_full) { 1301af1cf968SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1302af1cf968SStefano Zampini 1303af1cf968SStefano Zampini /* call destroy just to make sure we do not leak anything */ 1304af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1305792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixDestroy, aux_matrix); 1306af1cf968SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1307af1cf968SStefano Zampini 1308af1cf968SStefano Zampini /* Initialize with assembled flag -> it only recreates the aux_par_matrix */ 1309792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize, hA->ij); 1310af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 13116ea7df73SStefano Zampini if (aux_matrix) { 1312af1cf968SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see comment in MatHYPRESetPreallocation_HYPRE */ 131322235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 1314792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixInitialize, aux_matrix); 131522235d61SPierre Jolivet #else 1316792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixInitialize_v2, aux_matrix, HYPRE_MEMORY_HOST); 131722235d61SPierre Jolivet #endif 1318af1cf968SStefano Zampini } 13196ea7df73SStefano Zampini } 13206ea7df73SStefano Zampini { 13216ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 13226ea7df73SStefano Zampini 1323792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr); 1324792fecdfSBarry Smith if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscCallExternal(hypre_MatvecCommPkgCreate, parcsr); 13256ea7df73SStefano Zampini } 13269566063dSJacob Faibussowitsch if (!hA->x) PetscCall(VecHYPRE_IJVectorCreate(A->cmap, &hA->x)); 13279566063dSJacob Faibussowitsch if (!hA->b) PetscCall(VecHYPRE_IJVectorCreate(A->rmap, &hA->b)); 13286ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 13299566063dSJacob Faibussowitsch PetscCall(MatBindToCPU_HYPRE(A, A->boundtocpu)); 13306ea7df73SStefano Zampini #endif 13313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 133263c07aadSStefano Zampini } 133363c07aadSStefano Zampini 1334d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array) 1335d71ae5a4SJacob Faibussowitsch { 1336c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1337c69f721fSFande Kong 1338c69f721fSFande Kong PetscFunctionBegin; 133928b400f6SJacob Faibussowitsch PetscCheck(hA->available, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Temporary space is in use"); 1340c69f721fSFande Kong 134139accc25SStefano Zampini if (hA->size >= size) { 134239accc25SStefano Zampini *array = hA->array; 134339accc25SStefano Zampini } else { 13449566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array)); 1345c69f721fSFande Kong hA->size = size; 13469566063dSJacob Faibussowitsch PetscCall(PetscMalloc(hA->size, &hA->array)); 1347c69f721fSFande Kong *array = hA->array; 1348c69f721fSFande Kong } 1349c69f721fSFande Kong 1350c69f721fSFande Kong hA->available = PETSC_FALSE; 13513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1352c69f721fSFande Kong } 1353c69f721fSFande Kong 1354d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array) 1355d71ae5a4SJacob Faibussowitsch { 1356c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1357c69f721fSFande Kong 1358c69f721fSFande Kong PetscFunctionBegin; 1359c69f721fSFande Kong *array = NULL; 1360c69f721fSFande Kong hA->available = PETSC_TRUE; 13613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1362c69f721fSFande Kong } 1363c69f721fSFande Kong 1364d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins) 1365d71ae5a4SJacob Faibussowitsch { 1366d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1367d975228cSstefano_zampini PetscScalar *vals = (PetscScalar *)v; 136839accc25SStefano Zampini HYPRE_Complex *sscr; 1369c69f721fSFande Kong PetscInt *cscr[2]; 1370c69f721fSFande Kong PetscInt i, nzc; 137108defe43SFande Kong void *array = NULL; 1372d975228cSstefano_zampini 1373d975228cSstefano_zampini PetscFunctionBegin; 13749566063dSJacob Faibussowitsch PetscCall(MatGetArray_HYPRE(A, sizeof(PetscInt) * (2 * nc) + sizeof(HYPRE_Complex) * nc * nr, &array)); 1375c69f721fSFande Kong cscr[0] = (PetscInt *)array; 1376c69f721fSFande Kong cscr[1] = ((PetscInt *)array) + nc; 137739accc25SStefano Zampini sscr = (HYPRE_Complex *)(((PetscInt *)array) + nc * 2); 1378d975228cSstefano_zampini for (i = 0, nzc = 0; i < nc; i++) { 1379d975228cSstefano_zampini if (cols[i] >= 0) { 1380d975228cSstefano_zampini cscr[0][nzc] = cols[i]; 1381d975228cSstefano_zampini cscr[1][nzc++] = i; 1382d975228cSstefano_zampini } 1383d975228cSstefano_zampini } 1384c69f721fSFande Kong if (!nzc) { 13859566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A, &array)); 13863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1387c69f721fSFande Kong } 1388d975228cSstefano_zampini 13896ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE) 13906ea7df73SStefano Zampini if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) { 13916ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 13926ea7df73SStefano Zampini 1393792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 1394792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMigrate,parcsr, HYPRE_MEMORY_HOST); 13956ea7df73SStefano Zampini } 13966ea7df73SStefano Zampini #endif 13976ea7df73SStefano Zampini 1398d975228cSstefano_zampini if (ins == ADD_VALUES) { 1399d975228cSstefano_zampini for (i = 0; i < nr; i++) { 14006ea7df73SStefano Zampini if (rows[i] >= 0) { 1401d975228cSstefano_zampini PetscInt j; 14022cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 14032cf14000SStefano Zampini 1404aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]); 14059566063dSJacob Faibussowitsch for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j])); 1406792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixAddToValues, hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr); 1407d975228cSstefano_zampini } 1408d975228cSstefano_zampini vals += nc; 1409d975228cSstefano_zampini } 1410d975228cSstefano_zampini } else { /* INSERT_VALUES */ 1411d975228cSstefano_zampini PetscInt rst, ren; 1412c69f721fSFande Kong 14139566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, &ren)); 1414d975228cSstefano_zampini for (i = 0; i < nr; i++) { 14156ea7df73SStefano Zampini if (rows[i] >= 0) { 1416d975228cSstefano_zampini PetscInt j; 14172cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 14182cf14000SStefano Zampini 1419aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]); 14209566063dSJacob Faibussowitsch for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j])); 1421c69f721fSFande Kong /* nonlocal values */ 14229566063dSJacob Faibussowitsch if (rows[i] < rst || rows[i] >= ren) PetscCall(MatStashValuesRow_Private(&A->stash, rows[i], nzc, cscr[0], (PetscScalar *)sscr, PETSC_FALSE)); 1423c69f721fSFande Kong /* local values */ 1424792fecdfSBarry Smith else PetscCallExternal(HYPRE_IJMatrixSetValues, hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr); 1425d975228cSstefano_zampini } 1426d975228cSstefano_zampini vals += nc; 1427d975228cSstefano_zampini } 1428d975228cSstefano_zampini } 1429c69f721fSFande Kong 14309566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A, &array)); 14313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1432d975228cSstefano_zampini } 1433d975228cSstefano_zampini 1434d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1435d71ae5a4SJacob Faibussowitsch { 1436d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 14377d968826Sstefano_zampini HYPRE_Int *hdnnz, *honnz; 143806a29025Sstefano_zampini PetscInt i, rs, re, cs, ce, bs; 1439d975228cSstefano_zampini PetscMPIInt size; 1440d975228cSstefano_zampini 1441d975228cSstefano_zampini PetscFunctionBegin; 14429566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 14439566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 1444d975228cSstefano_zampini rs = A->rmap->rstart; 1445d975228cSstefano_zampini re = A->rmap->rend; 1446d975228cSstefano_zampini cs = A->cmap->rstart; 1447d975228cSstefano_zampini ce = A->cmap->rend; 1448d975228cSstefano_zampini if (!hA->ij) { 1449792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rs, re - 1, cs, ce - 1, &hA->ij); 1450792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR); 1451d975228cSstefano_zampini } else { 14522cf14000SStefano Zampini HYPRE_BigInt hrs, hre, hcs, hce; 1453792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetLocalRange, hA->ij, &hrs, &hre, &hcs, &hce); 1454aed4548fSBarry Smith PetscCheck(hre - hrs + 1 == re - rs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local rows: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hrs, hre + 1, rs, re); 1455aed4548fSBarry Smith PetscCheck(hce - hcs + 1 == ce - cs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local cols: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hcs, hce + 1, cs, ce); 1456d975228cSstefano_zampini } 14579566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 145806a29025Sstefano_zampini if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10 * bs; 145906a29025Sstefano_zampini if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10 * bs; 146006a29025Sstefano_zampini 1461d975228cSstefano_zampini if (!dnnz) { 14629566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &hdnnz)); 1463d975228cSstefano_zampini for (i = 0; i < A->rmap->n; i++) hdnnz[i] = dnz; 1464d975228cSstefano_zampini } else { 14657d968826Sstefano_zampini hdnnz = (HYPRE_Int *)dnnz; 1466d975228cSstefano_zampini } 14679566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size)); 1468d975228cSstefano_zampini if (size > 1) { 1469ddbeb582SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1470d975228cSstefano_zampini if (!onnz) { 14719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &honnz)); 1472d975228cSstefano_zampini for (i = 0; i < A->rmap->n; i++) honnz[i] = onz; 147322235d61SPierre Jolivet } else honnz = (HYPRE_Int *)onnz; 1474ddbeb582SStefano Zampini /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems 1475ddbeb582SStefano Zampini they assume the user will input the entire row values, properly sorted 1476336664bdSPierre Jolivet In PETSc, we don't make such an assumption and set this flag to 1, 1477336664bdSPierre Jolivet unless the option MAT_SORTED_FULL is set to true. 1478ddbeb582SStefano Zampini Also, to avoid possible memory leaks, we destroy and recreate the translator 1479ddbeb582SStefano Zampini This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize 1480ddbeb582SStefano Zampini the IJ matrix for us */ 1481ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1482ddbeb582SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 1483ddbeb582SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1484792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, hA->ij, hdnnz, honnz); 1485ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1486336664bdSPierre Jolivet hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !hA->sorted_full; 1487d975228cSstefano_zampini } else { 1488d975228cSstefano_zampini honnz = NULL; 1489792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetRowSizes, hA->ij, hdnnz); 1490d975228cSstefano_zampini } 1491ddbeb582SStefano Zampini 1492af1cf968SStefano Zampini /* reset assembled flag and call the initialize method */ 1493af1cf968SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 0; 14946ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 1495792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize, hA->ij); 14966ea7df73SStefano Zampini #else 1497792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize_v2, hA->ij, HYPRE_MEMORY_HOST); 14986ea7df73SStefano Zampini #endif 149948a46eb9SPierre Jolivet if (!dnnz) PetscCall(PetscFree(hdnnz)); 150048a46eb9SPierre Jolivet if (!onnz && honnz) PetscCall(PetscFree(honnz)); 1501af1cf968SStefano Zampini /* Match AIJ logic */ 150206a29025Sstefano_zampini A->preallocated = PETSC_TRUE; 1503af1cf968SStefano Zampini A->assembled = PETSC_FALSE; 15043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1505d975228cSstefano_zampini } 1506d975228cSstefano_zampini 1507d975228cSstefano_zampini /*@C 1508d975228cSstefano_zampini MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format 1509d975228cSstefano_zampini 1510c3339decSBarry Smith Collective 1511d975228cSstefano_zampini 1512d975228cSstefano_zampini Input Parameters: 1513d975228cSstefano_zampini + A - the matrix 1514d975228cSstefano_zampini . dnz - number of nonzeros per row in DIAGONAL portion of local submatrix 1515d975228cSstefano_zampini (same value is used for all local rows) 1516d975228cSstefano_zampini . dnnz - array containing the number of nonzeros in the various rows of the 1517d975228cSstefano_zampini DIAGONAL portion of the local submatrix (possibly different for each row) 15182ef1f0ffSBarry Smith or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `d_nz` is used to specify the nonzero structure. 15192ef1f0ffSBarry Smith The size of this array is equal to the number of local rows, i.e `m`. 1520d975228cSstefano_zampini For matrices that will be factored, you must leave room for (and set) 1521d975228cSstefano_zampini the diagonal entry even if it is zero. 1522d975228cSstefano_zampini . onz - number of nonzeros per row in the OFF-DIAGONAL portion of local 1523d975228cSstefano_zampini submatrix (same value is used for all local rows). 1524d975228cSstefano_zampini - onnz - array containing the number of nonzeros in the various rows of the 1525d975228cSstefano_zampini OFF-DIAGONAL portion of the local submatrix (possibly different for 15262ef1f0ffSBarry Smith each row) or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `o_nz` is used to specify the nonzero 1527d975228cSstefano_zampini structure. The size of this array is equal to the number 15282ef1f0ffSBarry Smith of local rows, i.e `m`. 1529d975228cSstefano_zampini 15302fe279fdSBarry Smith Level: intermediate 15312fe279fdSBarry Smith 153211a5261eSBarry Smith Note: 15332ef1f0ffSBarry Smith If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, `onz` and `onnz` are ignored. 1534d975228cSstefano_zampini 1535*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatMPIAIJSetPreallocation()`, `MATHYPRE`, `MATAIJ` 1536d975228cSstefano_zampini @*/ 1537d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1538d71ae5a4SJacob Faibussowitsch { 1539d975228cSstefano_zampini PetscFunctionBegin; 1540d975228cSstefano_zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1541d975228cSstefano_zampini PetscValidType(A, 1); 1542cac4c232SBarry Smith PetscTryMethod(A, "MatHYPRESetPreallocation_C", (Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[]), (A, dnz, dnnz, onz, onnz)); 15433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1544d975228cSstefano_zampini } 1545d975228cSstefano_zampini 154620f4b53cSBarry Smith /*@C 15472ef1f0ffSBarry Smith MatCreateFromParCSR - Creates a `Mat` from a `hypre_ParCSRMatrix` 1548225daaf8SStefano Zampini 1549225daaf8SStefano Zampini Collective 1550225daaf8SStefano Zampini 1551225daaf8SStefano Zampini Input Parameters: 15522ef1f0ffSBarry Smith + parcsr - the pointer to the `hypre_ParCSRMatrix` 15532ef1f0ffSBarry Smith . mtype - matrix type to be created. Currently `MATAIJ`, `MATIS` and `MATHYPRE` are supported. 155420f4b53cSBarry Smith - copymode - PETSc copying options, see `PetscCopyMode` 1555225daaf8SStefano Zampini 1556225daaf8SStefano Zampini Output Parameter: 1557225daaf8SStefano Zampini . A - the matrix 1558225daaf8SStefano Zampini 1559225daaf8SStefano Zampini Level: intermediate 1560225daaf8SStefano Zampini 1561*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatHYPRE`, `PetscCopyMode` 156220f4b53cSBarry Smith @*/ 1563d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat *A) 1564d71ae5a4SJacob Faibussowitsch { 1565225daaf8SStefano Zampini Mat T; 1566978814f1SStefano Zampini Mat_HYPRE *hA; 1567978814f1SStefano Zampini MPI_Comm comm; 1568978814f1SStefano Zampini PetscInt rstart, rend, cstart, cend, M, N; 1569d248a85cSRichard Tran Mills PetscBool isseqaij, isseqaijmkl, ismpiaij, isaij, ishyp, isis; 1570978814f1SStefano Zampini 1571978814f1SStefano Zampini PetscFunctionBegin; 1572978814f1SStefano Zampini comm = hypre_ParCSRMatrixComm(parcsr); 15739566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATSEQAIJ, &isseqaij)); 15749566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATSEQAIJMKL, &isseqaijmkl)); 15759566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATMPIAIJ, &ismpiaij)); 15769566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij)); 15779566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATHYPRE, &ishyp)); 15789566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATIS, &isis)); 1579d248a85cSRichard Tran Mills isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij); 15806ea7df73SStefano Zampini /* TODO */ 1581aed4548fSBarry Smith PetscCheck(isaij || ishyp || isis, comm, PETSC_ERR_SUP, "Unsupported MatType %s! Supported types are %s, %s, %s, %s, %s, and %s", mtype, MATAIJ, MATSEQAIJ, MATSEQAIJMKL, MATMPIAIJ, MATIS, MATHYPRE); 1582978814f1SStefano Zampini /* access ParCSRMatrix */ 1583978814f1SStefano Zampini rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr); 1584978814f1SStefano Zampini rend = hypre_ParCSRMatrixLastRowIndex(parcsr); 1585978814f1SStefano Zampini cstart = hypre_ParCSRMatrixFirstColDiag(parcsr); 1586978814f1SStefano Zampini cend = hypre_ParCSRMatrixLastColDiag(parcsr); 1587978814f1SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(parcsr); 1588978814f1SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(parcsr); 1589978814f1SStefano Zampini 1590fa92c42cSstefano_zampini /* fix for empty local rows/columns */ 1591fa92c42cSstefano_zampini if (rend < rstart) rend = rstart; 1592fa92c42cSstefano_zampini if (cend < cstart) cend = cstart; 1593fa92c42cSstefano_zampini 1594e6471dc9SStefano Zampini /* PETSc convention */ 1595e6471dc9SStefano Zampini rend++; 1596e6471dc9SStefano Zampini cend++; 1597e6471dc9SStefano Zampini rend = PetscMin(rend, M); 1598e6471dc9SStefano Zampini cend = PetscMin(cend, N); 1599e6471dc9SStefano Zampini 1600978814f1SStefano Zampini /* create PETSc matrix with MatHYPRE */ 16019566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &T)); 16029566063dSJacob Faibussowitsch PetscCall(MatSetSizes(T, rend - rstart, cend - cstart, M, N)); 16039566063dSJacob Faibussowitsch PetscCall(MatSetType(T, MATHYPRE)); 1604225daaf8SStefano Zampini hA = (Mat_HYPRE *)(T->data); 1605978814f1SStefano Zampini 1606978814f1SStefano Zampini /* create HYPRE_IJMatrix */ 1607792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij); 1608792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR); 160945b8d346SStefano Zampini 16106ea7df73SStefano Zampini // TODO DEV 161145b8d346SStefano Zampini /* create new ParCSR object if needed */ 161245b8d346SStefano Zampini if (ishyp && copymode == PETSC_COPY_VALUES) { 161345b8d346SStefano Zampini hypre_ParCSRMatrix *new_parcsr; 16146ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 161545b8d346SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd, *ndiag, *noffd; 161645b8d346SStefano Zampini 16170e6427aaSSatish Balay new_parcsr = hypre_ParCSRMatrixClone(parcsr, 0); 161845b8d346SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 161945b8d346SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 162045b8d346SStefano Zampini ndiag = hypre_ParCSRMatrixDiag(new_parcsr); 162145b8d346SStefano Zampini noffd = hypre_ParCSRMatrixOffd(new_parcsr); 16229566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(ndiag), hypre_CSRMatrixData(hdiag), hypre_CSRMatrixNumNonzeros(hdiag))); 16239566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(noffd), hypre_CSRMatrixData(hoffd), hypre_CSRMatrixNumNonzeros(hoffd))); 16246ea7df73SStefano Zampini #else 16256ea7df73SStefano Zampini new_parcsr = hypre_ParCSRMatrixClone(parcsr, 1); 16266ea7df73SStefano Zampini #endif 162745b8d346SStefano Zampini parcsr = new_parcsr; 162845b8d346SStefano Zampini copymode = PETSC_OWN_POINTER; 162945b8d346SStefano Zampini } 1630978814f1SStefano Zampini 1631978814f1SStefano Zampini /* set ParCSR object */ 1632978814f1SStefano Zampini hypre_IJMatrixObject(hA->ij) = parcsr; 16334ec6421dSstefano_zampini T->preallocated = PETSC_TRUE; 1634978814f1SStefano Zampini 1635978814f1SStefano Zampini /* set assembled flag */ 1636978814f1SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 1; 16376ea7df73SStefano Zampini #if 0 1638792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize,hA->ij); 16396ea7df73SStefano Zampini #endif 1640225daaf8SStefano Zampini if (ishyp) { 16416d2a658fSstefano_zampini PetscMPIInt myid = 0; 16426d2a658fSstefano_zampini 16436d2a658fSstefano_zampini /* make sure we always have row_starts and col_starts available */ 164448a46eb9SPierre Jolivet if (HYPRE_AssumedPartitionCheck()) PetscCallMPI(MPI_Comm_rank(comm, &myid)); 1645a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 16466d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) { 16476d2a658fSstefano_zampini PetscLayout map; 16486d2a658fSstefano_zampini 16499566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T, NULL, &map)); 16509566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 16512cf14000SStefano Zampini hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid); 16526d2a658fSstefano_zampini } 16536d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) { 16546d2a658fSstefano_zampini PetscLayout map; 16556d2a658fSstefano_zampini 16569566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T, &map, NULL)); 16579566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 16582cf14000SStefano Zampini hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid); 16596d2a658fSstefano_zampini } 1660a1d2239cSSatish Balay #endif 1661978814f1SStefano Zampini /* prevent from freeing the pointer */ 1662978814f1SStefano Zampini if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE; 1663225daaf8SStefano Zampini *A = T; 16649566063dSJacob Faibussowitsch PetscCall(MatSetOption(*A, MAT_SORTED_FULL, PETSC_TRUE)); 16659566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*A, MAT_FINAL_ASSEMBLY)); 16669566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*A, MAT_FINAL_ASSEMBLY)); 1667bb4689ddSStefano Zampini } else if (isaij) { 1668bb4689ddSStefano Zampini if (copymode != PETSC_OWN_POINTER) { 1669225daaf8SStefano Zampini /* prevent from freeing the pointer */ 1670225daaf8SStefano Zampini hA->inner_free = PETSC_FALSE; 16719566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INITIAL_MATRIX, A)); 16729566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T)); 1673225daaf8SStefano Zampini } else { /* AIJ return type with PETSC_OWN_POINTER */ 16749566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INPLACE_MATRIX, &T)); 1675225daaf8SStefano Zampini *A = T; 1676225daaf8SStefano Zampini } 1677bb4689ddSStefano Zampini } else if (isis) { 16789566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_IS(T, MATIS, MAT_INITIAL_MATRIX, A)); 16798cfe8d00SStefano Zampini if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE; 16809566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T)); 1681bb4689ddSStefano Zampini } 16823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1683978814f1SStefano Zampini } 1684978814f1SStefano Zampini 1685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr) 1686d71ae5a4SJacob Faibussowitsch { 1687dd9c0a25Sstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1688dd9c0a25Sstefano_zampini HYPRE_Int type; 1689dd9c0a25Sstefano_zampini 1690dd9c0a25Sstefano_zampini PetscFunctionBegin; 169128b400f6SJacob Faibussowitsch PetscCheck(hA->ij, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE_IJMatrix not present"); 1692792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type); 169308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "HYPRE_IJMatrix is not of type HYPRE_PARCSR"); 1694792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)parcsr); 16953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1696dd9c0a25Sstefano_zampini } 1697dd9c0a25Sstefano_zampini 169820f4b53cSBarry Smith /*@C 1699dd9c0a25Sstefano_zampini MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix 1700dd9c0a25Sstefano_zampini 17012ef1f0ffSBarry Smith Not Collective 1702dd9c0a25Sstefano_zampini 170320f4b53cSBarry Smith Input Parameter: 170420f4b53cSBarry Smith . A - the `MATHYPRE` object 1705dd9c0a25Sstefano_zampini 1706dd9c0a25Sstefano_zampini Output Parameter: 17072ef1f0ffSBarry Smith . parcsr - the pointer to the `hypre_ParCSRMatrix` 1708dd9c0a25Sstefano_zampini 1709dd9c0a25Sstefano_zampini Level: intermediate 1710dd9c0a25Sstefano_zampini 1711*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatHYPRE`, `PetscCopyMode` 171220f4b53cSBarry Smith @*/ 1713d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr) 1714d71ae5a4SJacob Faibussowitsch { 1715dd9c0a25Sstefano_zampini PetscFunctionBegin; 1716dd9c0a25Sstefano_zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1717dd9c0a25Sstefano_zampini PetscValidType(A, 1); 1718cac4c232SBarry Smith PetscUseMethod(A, "MatHYPREGetParCSR_C", (Mat, hypre_ParCSRMatrix **), (A, parcsr)); 17193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1720dd9c0a25Sstefano_zampini } 1721dd9c0a25Sstefano_zampini 1722d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_HYPRE(Mat A, PetscBool *missing, PetscInt *dd) 1723d71ae5a4SJacob Faibussowitsch { 172468ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 172568ec7858SStefano Zampini hypre_CSRMatrix *ha; 172668ec7858SStefano Zampini PetscInt rst; 172768ec7858SStefano Zampini 172868ec7858SStefano Zampini PetscFunctionBegin; 172908401ef6SPierre Jolivet PetscCheck(A->rmap->n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_SUP, "Not implemented with non-square diagonal blocks"); 17309566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, NULL)); 17319566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 173268ec7858SStefano Zampini if (missing) *missing = PETSC_FALSE; 173368ec7858SStefano Zampini if (dd) *dd = -1; 173468ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 173568ec7858SStefano Zampini if (ha) { 173668299464SStefano Zampini PetscInt size, i; 173768299464SStefano Zampini HYPRE_Int *ii, *jj; 173868ec7858SStefano Zampini 173968ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 174068ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 174168ec7858SStefano Zampini jj = hypre_CSRMatrixJ(ha); 174268ec7858SStefano Zampini for (i = 0; i < size; i++) { 174368ec7858SStefano Zampini PetscInt j; 174468ec7858SStefano Zampini PetscBool found = PETSC_FALSE; 174568ec7858SStefano Zampini 17469371c9d4SSatish Balay for (j = ii[i]; j < ii[i + 1] && !found; j++) found = (jj[j] == i) ? PETSC_TRUE : PETSC_FALSE; 174768ec7858SStefano Zampini 174868ec7858SStefano Zampini if (!found) { 17493ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing local diagonal entry %" PetscInt_FMT "\n", i)); 175068ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 175168ec7858SStefano Zampini if (dd) *dd = i + rst; 17523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 175368ec7858SStefano Zampini } 175468ec7858SStefano Zampini } 175568ec7858SStefano Zampini if (!size) { 17563ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n")); 175768ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 175868ec7858SStefano Zampini if (dd) *dd = rst; 175968ec7858SStefano Zampini } 176068ec7858SStefano Zampini } else { 17613ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n")); 176268ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 176368ec7858SStefano Zampini if (dd) *dd = rst; 176468ec7858SStefano Zampini } 17653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 176668ec7858SStefano Zampini } 176768ec7858SStefano Zampini 1768d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s) 1769d71ae5a4SJacob Faibussowitsch { 177068ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 17716ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 177268ec7858SStefano Zampini hypre_CSRMatrix *ha; 17736ea7df73SStefano Zampini #endif 177439accc25SStefano Zampini HYPRE_Complex hs; 177568ec7858SStefano Zampini 177668ec7858SStefano Zampini PetscFunctionBegin; 17779566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(s, &hs)); 17789566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 17796ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 19, 0) 1780792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixScale, parcsr, hs); 17816ea7df73SStefano Zampini #else /* diagonal part */ 178268ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 178368ec7858SStefano Zampini if (ha) { 178468299464SStefano Zampini PetscInt size, i; 178568299464SStefano Zampini HYPRE_Int *ii; 178639accc25SStefano Zampini HYPRE_Complex *a; 178768ec7858SStefano Zampini 178868ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 178968ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 179068ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 179139accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 179268ec7858SStefano Zampini } 179368ec7858SStefano Zampini /* offdiagonal part */ 179468ec7858SStefano Zampini ha = hypre_ParCSRMatrixOffd(parcsr); 179568ec7858SStefano Zampini if (ha) { 179668299464SStefano Zampini PetscInt size, i; 179768299464SStefano Zampini HYPRE_Int *ii; 179839accc25SStefano Zampini HYPRE_Complex *a; 179968ec7858SStefano Zampini 180068ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 180168ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 180268ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 180339accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 180468ec7858SStefano Zampini } 18056ea7df73SStefano Zampini #endif 18063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 180768ec7858SStefano Zampini } 180868ec7858SStefano Zampini 1809d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 1810d71ae5a4SJacob Faibussowitsch { 181168ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 181268299464SStefano Zampini HYPRE_Int *lrows; 181368299464SStefano Zampini PetscInt rst, ren, i; 181468ec7858SStefano Zampini 181568ec7858SStefano Zampini PetscFunctionBegin; 181608401ef6SPierre Jolivet PetscCheck(!x && !b, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "To be implemented"); 18179566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 18189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numRows, &lrows)); 18199566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, &ren)); 182068ec7858SStefano Zampini for (i = 0; i < numRows; i++) { 18217a46b595SBarry Smith PetscCheck(rows[i] >= rst && rows[i] < ren, PETSC_COMM_SELF, PETSC_ERR_SUP, "Non-local rows not yet supported"); 182268ec7858SStefano Zampini lrows[i] = rows[i] - rst; 182368ec7858SStefano Zampini } 1824792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixEliminateRowsCols, parcsr, numRows, lrows); 18259566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows)); 18263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 182768ec7858SStefano Zampini } 182868ec7858SStefano Zampini 1829d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha) 1830d71ae5a4SJacob Faibussowitsch { 1831c69f721fSFande Kong PetscFunctionBegin; 1832c69f721fSFande Kong if (ha) { 1833c69f721fSFande Kong HYPRE_Int *ii, size; 1834c69f721fSFande Kong HYPRE_Complex *a; 1835c69f721fSFande Kong 1836c69f721fSFande Kong size = hypre_CSRMatrixNumRows(ha); 1837c69f721fSFande Kong a = hypre_CSRMatrixData(ha); 1838c69f721fSFande Kong ii = hypre_CSRMatrixI(ha); 1839c69f721fSFande Kong 18409566063dSJacob Faibussowitsch if (a) PetscCall(PetscArrayzero(a, ii[size])); 1841c69f721fSFande Kong } 18423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1843c69f721fSFande Kong } 1844c69f721fSFande Kong 1845d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_HYPRE(Mat A) 1846d71ae5a4SJacob Faibussowitsch { 18476ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 18486ea7df73SStefano Zampini 18496ea7df73SStefano Zampini PetscFunctionBegin; 18506ea7df73SStefano Zampini if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) { 1851792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetConstantValues, hA->ij, 0.0); 18526ea7df73SStefano Zampini } else { 1853c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 1854c69f721fSFande Kong 18559566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 18569566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr))); 18579566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr))); 18586ea7df73SStefano Zampini } 18593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1860c69f721fSFande Kong } 1861c69f721fSFande Kong 1862d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA, PetscInt N, const PetscInt rows[], HYPRE_Complex diag) 1863d71ae5a4SJacob Faibussowitsch { 186439accc25SStefano Zampini PetscInt ii; 186539accc25SStefano Zampini HYPRE_Int *i, *j; 186639accc25SStefano Zampini HYPRE_Complex *a; 1867c69f721fSFande Kong 1868c69f721fSFande Kong PetscFunctionBegin; 18693ba16761SJacob Faibussowitsch if (!hA) PetscFunctionReturn(PETSC_SUCCESS); 1870c69f721fSFande Kong 187139accc25SStefano Zampini i = hypre_CSRMatrixI(hA); 187239accc25SStefano Zampini j = hypre_CSRMatrixJ(hA); 1873c69f721fSFande Kong a = hypre_CSRMatrixData(hA); 1874c69f721fSFande Kong 1875c69f721fSFande Kong for (ii = 0; ii < N; ii++) { 187639accc25SStefano Zampini HYPRE_Int jj, ibeg, iend, irow; 187739accc25SStefano Zampini 1878c69f721fSFande Kong irow = rows[ii]; 1879c69f721fSFande Kong ibeg = i[irow]; 1880c69f721fSFande Kong iend = i[irow + 1]; 1881c69f721fSFande Kong for (jj = ibeg; jj < iend; jj++) 1882c69f721fSFande Kong if (j[jj] == irow) a[jj] = diag; 1883c69f721fSFande Kong else a[jj] = 0.0; 1884c69f721fSFande Kong } 18853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1886c69f721fSFande Kong } 1887c69f721fSFande Kong 1888d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 1889d71ae5a4SJacob Faibussowitsch { 1890c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 1891c69f721fSFande Kong PetscInt *lrows, len; 189239accc25SStefano Zampini HYPRE_Complex hdiag; 1893c69f721fSFande Kong 1894c69f721fSFande Kong PetscFunctionBegin; 189508401ef6SPierre Jolivet PetscCheck(!x && !b, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size"); 18969566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(diag, &hdiag)); 1897c69f721fSFande Kong /* retrieve the internal matrix */ 18989566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 1899c69f721fSFande Kong /* get locally owned rows */ 19009566063dSJacob Faibussowitsch PetscCall(MatZeroRowsMapLocal_Private(A, N, rows, &len, &lrows)); 1901c69f721fSFande Kong /* zero diagonal part */ 19029566063dSJacob Faibussowitsch PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr), len, lrows, hdiag)); 1903c69f721fSFande Kong /* zero off-diagonal part */ 19049566063dSJacob Faibussowitsch PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr), len, lrows, 0.0)); 1905c69f721fSFande Kong 19069566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows)); 19073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1908c69f721fSFande Kong } 1909c69f721fSFande Kong 1910d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat, MatAssemblyType mode) 1911d71ae5a4SJacob Faibussowitsch { 1912c69f721fSFande Kong PetscFunctionBegin; 19133ba16761SJacob Faibussowitsch if (mat->nooffprocentries) PetscFunctionReturn(PETSC_SUCCESS); 1914c69f721fSFande Kong 19159566063dSJacob Faibussowitsch PetscCall(MatStashScatterBegin_Private(mat, &mat->stash, mat->rmap->range)); 19163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1917c69f721fSFande Kong } 1918c69f721fSFande Kong 1919d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 1920d71ae5a4SJacob Faibussowitsch { 1921c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 19222cf14000SStefano Zampini HYPRE_Int hnz; 1923c69f721fSFande Kong 1924c69f721fSFande Kong PetscFunctionBegin; 1925c69f721fSFande Kong /* retrieve the internal matrix */ 19269566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 1927c69f721fSFande Kong /* call HYPRE API */ 1928792fecdfSBarry Smith PetscCallExternal(HYPRE_ParCSRMatrixGetRow, parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v); 19292cf14000SStefano Zampini if (nz) *nz = (PetscInt)hnz; 19303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1931c69f721fSFande Kong } 1932c69f721fSFande Kong 1933d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 1934d71ae5a4SJacob Faibussowitsch { 1935c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 19362cf14000SStefano Zampini HYPRE_Int hnz; 1937c69f721fSFande Kong 1938c69f721fSFande Kong PetscFunctionBegin; 1939c69f721fSFande Kong /* retrieve the internal matrix */ 19409566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 1941c69f721fSFande Kong /* call HYPRE API */ 19422cf14000SStefano Zampini hnz = nz ? (HYPRE_Int)(*nz) : 0; 1943792fecdfSBarry Smith PetscCallExternal(HYPRE_ParCSRMatrixRestoreRow, parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v); 19443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1945c69f721fSFande Kong } 1946c69f721fSFande Kong 1947d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetValues_HYPRE(Mat A, PetscInt m, const PetscInt idxm[], PetscInt n, const PetscInt idxn[], PetscScalar v[]) 1948d71ae5a4SJacob Faibussowitsch { 194945b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1950c69f721fSFande Kong PetscInt i; 19511d4906efSStefano Zampini 1952c69f721fSFande Kong PetscFunctionBegin; 19533ba16761SJacob Faibussowitsch if (!m || !n) PetscFunctionReturn(PETSC_SUCCESS); 1954c69f721fSFande Kong /* Ignore negative row indices 1955c69f721fSFande Kong * And negative column indices should be automatically ignored in hypre 1956c69f721fSFande Kong * */ 19572cf14000SStefano Zampini for (i = 0; i < m; i++) { 19582cf14000SStefano Zampini if (idxm[i] >= 0) { 19592cf14000SStefano Zampini HYPRE_Int hn = (HYPRE_Int)n; 1960792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetValues, hA->ij, 1, &hn, (HYPRE_BigInt *)&idxm[i], (HYPRE_BigInt *)idxn, (HYPRE_Complex *)(v + i * n)); 19612cf14000SStefano Zampini } 19622cf14000SStefano Zampini } 19633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1964c69f721fSFande Kong } 1965c69f721fSFande Kong 1966d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetOption_HYPRE(Mat A, MatOption op, PetscBool flg) 1967d71ae5a4SJacob Faibussowitsch { 1968ddbeb582SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1969ddbeb582SStefano Zampini 1970ddbeb582SStefano Zampini PetscFunctionBegin; 1971c6698e78SStefano Zampini switch (op) { 1972ddbeb582SStefano Zampini case MAT_NO_OFF_PROC_ENTRIES: 197348a46eb9SPierre Jolivet if (flg) PetscCallExternal(HYPRE_IJMatrixSetMaxOffProcElmts, hA->ij, 0); 1974ddbeb582SStefano Zampini break; 1975d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 1976d71ae5a4SJacob Faibussowitsch hA->sorted_full = flg; 1977d71ae5a4SJacob Faibussowitsch break; 1978d71ae5a4SJacob Faibussowitsch default: 1979d71ae5a4SJacob Faibussowitsch break; 1980ddbeb582SStefano Zampini } 19813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1982ddbeb582SStefano Zampini } 1983c69f721fSFande Kong 1984d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view) 1985d71ae5a4SJacob Faibussowitsch { 198645b8d346SStefano Zampini PetscViewerFormat format; 198745b8d346SStefano Zampini 198845b8d346SStefano Zampini PetscFunctionBegin; 19899566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(view, &format)); 19903ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 199145b8d346SStefano Zampini if (format != PETSC_VIEWER_NATIVE) { 19926ea7df73SStefano Zampini Mat B; 19936ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 19946ea7df73SStefano Zampini PetscErrorCode (*mview)(Mat, PetscViewer) = NULL; 19956ea7df73SStefano Zampini 19969566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 19979566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(parcsr, MATAIJ, PETSC_USE_POINTER, &B)); 19989566063dSJacob Faibussowitsch PetscCall(MatGetOperation(B, MATOP_VIEW, (void (**)(void)) & mview)); 199928b400f6SJacob Faibussowitsch PetscCheck(mview, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Missing view operation"); 20009566063dSJacob Faibussowitsch PetscCall((*mview)(B, view)); 20019566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 200245b8d346SStefano Zampini } else { 200345b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 200445b8d346SStefano Zampini PetscMPIInt size; 200545b8d346SStefano Zampini PetscBool isascii; 200645b8d346SStefano Zampini const char *filename; 200745b8d346SStefano Zampini 200845b8d346SStefano Zampini /* HYPRE uses only text files */ 20099566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)view, PETSCVIEWERASCII, &isascii)); 201028b400f6SJacob Faibussowitsch PetscCheck(isascii, PetscObjectComm((PetscObject)view), PETSC_ERR_SUP, "PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII", ((PetscObject)view)->type_name); 20119566063dSJacob Faibussowitsch PetscCall(PetscViewerFileGetName(view, &filename)); 2012792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixPrint, hA->ij, filename); 20139566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(hA->comm, &size)); 201445b8d346SStefano Zampini if (size > 1) { 20159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view, "Matrix files: %s.%05d ... %s.%05d\n", filename, 0, filename, size - 1)); 201645b8d346SStefano Zampini } else { 20179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view, "Matrix file: %s.%05d\n", filename, 0)); 201845b8d346SStefano Zampini } 201945b8d346SStefano Zampini } 20203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202145b8d346SStefano Zampini } 202245b8d346SStefano Zampini 2023d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDuplicate_HYPRE(Mat A, MatDuplicateOption op, Mat *B) 2024d71ae5a4SJacob Faibussowitsch { 20256abb4441SStefano Zampini hypre_ParCSRMatrix *parcsr = NULL; 202645b8d346SStefano Zampini PetscCopyMode cpmode; 202745b8d346SStefano Zampini 202845b8d346SStefano Zampini PetscFunctionBegin; 20299566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 203045b8d346SStefano Zampini if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) { 20310e6427aaSSatish Balay parcsr = hypre_ParCSRMatrixClone(parcsr, 0); 203245b8d346SStefano Zampini cpmode = PETSC_OWN_POINTER; 203345b8d346SStefano Zampini } else { 203445b8d346SStefano Zampini cpmode = PETSC_COPY_VALUES; 203545b8d346SStefano Zampini } 20369566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(parcsr, MATHYPRE, cpmode, B)); 20373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 203845b8d346SStefano Zampini } 203945b8d346SStefano Zampini 2040d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str) 2041d71ae5a4SJacob Faibussowitsch { 2042465edc17SStefano Zampini hypre_ParCSRMatrix *acsr, *bcsr; 2043465edc17SStefano Zampini 2044465edc17SStefano Zampini PetscFunctionBegin; 2045465edc17SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 20469566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &acsr)); 20479566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(B, &bcsr)); 2048792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixCopy, acsr, bcsr, 1); 20499566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 20509566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 20519566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 2052465edc17SStefano Zampini } else { 20539566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2054465edc17SStefano Zampini } 20553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2056465edc17SStefano Zampini } 2057465edc17SStefano Zampini 2058d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d) 2059d71ae5a4SJacob Faibussowitsch { 20606305df00SStefano Zampini hypre_ParCSRMatrix *parcsr; 20616305df00SStefano Zampini hypre_CSRMatrix *dmat; 206239accc25SStefano Zampini HYPRE_Complex *a; 206339accc25SStefano Zampini HYPRE_Complex *data = NULL; 20642cf14000SStefano Zampini HYPRE_Int *diag = NULL; 20652cf14000SStefano Zampini PetscInt i; 20666305df00SStefano Zampini PetscBool cong; 20676305df00SStefano Zampini 20686305df00SStefano Zampini PetscFunctionBegin; 20699566063dSJacob Faibussowitsch PetscCall(MatHasCongruentLayouts(A, &cong)); 207028b400f6SJacob Faibussowitsch PetscCheck(cong, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only for square matrices with same local distributions of rows and columns"); 207176bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 20726305df00SStefano Zampini PetscBool miss; 20739566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal(A, &miss, NULL)); 207408401ef6SPierre Jolivet PetscCheck(!miss || !A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_SUP, "Not implemented when diagonal entries are missing"); 20756305df00SStefano Zampini } 20769566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 20776305df00SStefano Zampini dmat = hypre_ParCSRMatrixDiag(parcsr); 20786305df00SStefano Zampini if (dmat) { 207939accc25SStefano Zampini /* this cast fixes the clang error: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 20809566063dSJacob Faibussowitsch PetscCall(VecGetArray(d, (PetscScalar **)&a)); 20812cf14000SStefano Zampini diag = hypre_CSRMatrixI(dmat); 208239accc25SStefano Zampini data = hypre_CSRMatrixData(dmat); 20836305df00SStefano Zampini for (i = 0; i < A->rmap->n; i++) a[i] = data[diag[i]]; 20849566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(d, (PetscScalar **)&a)); 20856305df00SStefano Zampini } 20863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20876305df00SStefano Zampini } 20886305df00SStefano Zampini 2089363d496dSStefano Zampini #include <petscblaslapack.h> 2090363d496dSStefano Zampini 2091d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAXPY_HYPRE(Mat Y, PetscScalar a, Mat X, MatStructure str) 2092d71ae5a4SJacob Faibussowitsch { 2093363d496dSStefano Zampini PetscFunctionBegin; 20946ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 20956ea7df73SStefano Zampini { 20966ea7df73SStefano Zampini Mat B; 20976ea7df73SStefano Zampini hypre_ParCSRMatrix *x, *y, *z; 20986ea7df73SStefano Zampini 20999566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y, &y)); 21009566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X, &x)); 2101792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixAdd, 1.0, y, 1.0, x, &z); 21029566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(z, MATHYPRE, PETSC_OWN_POINTER, &B)); 21039566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 21046ea7df73SStefano Zampini } 21056ea7df73SStefano Zampini #else 2106363d496dSStefano Zampini if (str == SAME_NONZERO_PATTERN) { 2107363d496dSStefano Zampini hypre_ParCSRMatrix *x, *y; 2108363d496dSStefano Zampini hypre_CSRMatrix *xloc, *yloc; 2109363d496dSStefano Zampini PetscInt xnnz, ynnz; 211039accc25SStefano Zampini HYPRE_Complex *xarr, *yarr; 2111363d496dSStefano Zampini PetscBLASInt one = 1, bnz; 2112363d496dSStefano Zampini 21139566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y, &y)); 21149566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X, &x)); 2115363d496dSStefano Zampini 2116363d496dSStefano Zampini /* diagonal block */ 2117363d496dSStefano Zampini xloc = hypre_ParCSRMatrixDiag(x); 2118363d496dSStefano Zampini yloc = hypre_ParCSRMatrixDiag(y); 2119363d496dSStefano Zampini xnnz = 0; 2120363d496dSStefano Zampini ynnz = 0; 2121363d496dSStefano Zampini xarr = NULL; 2122363d496dSStefano Zampini yarr = NULL; 2123363d496dSStefano Zampini if (xloc) { 212439accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2125363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2126363d496dSStefano Zampini } 2127363d496dSStefano Zampini if (yloc) { 212839accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2129363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2130363d496dSStefano Zampini } 213108401ef6SPierre Jolivet PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz); 21329566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz, &bnz)); 2133792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one)); 2134363d496dSStefano Zampini 2135363d496dSStefano Zampini /* off-diagonal block */ 2136363d496dSStefano Zampini xloc = hypre_ParCSRMatrixOffd(x); 2137363d496dSStefano Zampini yloc = hypre_ParCSRMatrixOffd(y); 2138363d496dSStefano Zampini xnnz = 0; 2139363d496dSStefano Zampini ynnz = 0; 2140363d496dSStefano Zampini xarr = NULL; 2141363d496dSStefano Zampini yarr = NULL; 2142363d496dSStefano Zampini if (xloc) { 214339accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2144363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2145363d496dSStefano Zampini } 2146363d496dSStefano Zampini if (yloc) { 214739accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2148363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2149363d496dSStefano Zampini } 215008401ef6SPierre Jolivet PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz); 21519566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz, &bnz)); 2152792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one)); 2153363d496dSStefano Zampini } else if (str == SUBSET_NONZERO_PATTERN) { 21549566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 2155363d496dSStefano Zampini } else { 2156363d496dSStefano Zampini Mat B; 2157363d496dSStefano Zampini 21589566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic_Preallocate(Y, X, &B)); 21599566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 21609566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(Y, &B)); 2161363d496dSStefano Zampini } 21626ea7df73SStefano Zampini #endif 21633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2164363d496dSStefano Zampini } 2165363d496dSStefano Zampini 2166d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetPreallocationCOO_HYPRE(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 2167d71ae5a4SJacob Faibussowitsch { 21685fbaff96SJunchao Zhang MPI_Comm comm; 21695fbaff96SJunchao Zhang PetscMPIInt size; 21705fbaff96SJunchao Zhang PetscLayout rmap, cmap; 21715fbaff96SJunchao Zhang Mat_HYPRE *hmat; 21725fbaff96SJunchao Zhang hypre_ParCSRMatrix *parCSR; 21735fbaff96SJunchao Zhang hypre_CSRMatrix *diag, *offd; 21745fbaff96SJunchao Zhang Mat A, B, cooMat; 21755fbaff96SJunchao Zhang PetscScalar *Aa, *Ba; 21765fbaff96SJunchao Zhang HYPRE_MemoryLocation hypreMemtype = HYPRE_MEMORY_HOST; 21775fbaff96SJunchao Zhang PetscMemType petscMemtype; 21785fbaff96SJunchao Zhang MatType matType = MATAIJ; /* default type of cooMat */ 21795fbaff96SJunchao Zhang 21805fbaff96SJunchao Zhang PetscFunctionBegin; 21815fbaff96SJunchao Zhang /* Build an agent matrix cooMat whose type is either MATAIJ or MATAIJKOKKOS. 21825fbaff96SJunchao Zhang It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work. 21835fbaff96SJunchao Zhang */ 21845fbaff96SJunchao Zhang PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 21855fbaff96SJunchao Zhang PetscCallMPI(MPI_Comm_size(comm, &size)); 21865fbaff96SJunchao Zhang PetscCall(PetscLayoutSetUp(mat->rmap)); 21875fbaff96SJunchao Zhang PetscCall(PetscLayoutSetUp(mat->cmap)); 21885fbaff96SJunchao Zhang PetscCall(MatGetLayouts(mat, &rmap, &cmap)); 21895fbaff96SJunchao Zhang 21905fbaff96SJunchao Zhang /* I do not know how hypre_ParCSRMatrix stores diagonal elements for non-square matrices, so I just give up now */ 21915fbaff96SJunchao Zhang PetscCheck(rmap->N == cmap->N, comm, PETSC_ERR_SUP, "MATHYPRE COO cannot handle non-square matrices"); 21925fbaff96SJunchao Zhang 21935fbaff96SJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 21945fbaff96SJunchao Zhang if (!mat->boundtocpu) { /* mat will be on device, so will cooMat */ 21955fbaff96SJunchao Zhang #if defined(PETSC_HAVE_KOKKOS) 21965fbaff96SJunchao Zhang matType = MATAIJKOKKOS; 21975fbaff96SJunchao Zhang #else 21985fbaff96SJunchao Zhang SETERRQ(comm, PETSC_ERR_SUP, "To support MATHYPRE COO assembly on device, we need Kokkos, e.g., --download-kokkos --download-kokkos-kernels"); 21995fbaff96SJunchao Zhang #endif 22005fbaff96SJunchao Zhang } 22015fbaff96SJunchao Zhang #endif 22025fbaff96SJunchao Zhang 22035fbaff96SJunchao Zhang /* Do COO preallocation through cooMat */ 22045fbaff96SJunchao Zhang hmat = (Mat_HYPRE *)mat->data; 22055fbaff96SJunchao Zhang PetscCall(MatDestroy(&hmat->cooMat)); 22065fbaff96SJunchao Zhang PetscCall(MatCreate(comm, &cooMat)); 22075fbaff96SJunchao Zhang PetscCall(MatSetType(cooMat, matType)); 22085fbaff96SJunchao Zhang PetscCall(MatSetLayouts(cooMat, rmap, cmap)); 22095fbaff96SJunchao Zhang PetscCall(MatSetPreallocationCOO(cooMat, coo_n, coo_i, coo_j)); 22105fbaff96SJunchao Zhang 22115fbaff96SJunchao Zhang /* Copy the sparsity pattern from cooMat to hypre IJMatrix hmat->ij */ 22125fbaff96SJunchao Zhang PetscCall(MatSetOption(mat, MAT_SORTED_FULL, PETSC_TRUE)); 22135fbaff96SJunchao Zhang PetscCall(MatSetOption(mat, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 22145fbaff96SJunchao Zhang PetscCall(MatHYPRE_CreateFromMat(cooMat, hmat)); /* Create hmat->ij and preallocate it */ 22155fbaff96SJunchao Zhang PetscCall(MatHYPRE_IJMatrixCopy(cooMat, hmat->ij)); /* Copy A's (a,i,j) to hmat->ij. To reuse code. Copying 'a' is not really needed */ 22165fbaff96SJunchao Zhang 22175fbaff96SJunchao Zhang mat->preallocated = PETSC_TRUE; 22185fbaff96SJunchao Zhang PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 22195fbaff96SJunchao Zhang PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); /* Migrate mat to device if it is bound to. Hypre builds its own SpMV context here */ 22205fbaff96SJunchao Zhang 22215fbaff96SJunchao Zhang /* Alias cooMat's data array to IJMatrix's */ 2222792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hmat->ij, (void **)&parCSR); 22235fbaff96SJunchao Zhang diag = hypre_ParCSRMatrixDiag(parCSR); 22245fbaff96SJunchao Zhang offd = hypre_ParCSRMatrixOffd(parCSR); 22255fbaff96SJunchao Zhang 22265fbaff96SJunchao Zhang hypreMemtype = hypre_CSRMatrixMemoryLocation(diag); 22275fbaff96SJunchao Zhang A = (size == 1) ? cooMat : ((Mat_MPIAIJ *)cooMat->data)->A; 22285fbaff96SJunchao Zhang PetscCall(MatSeqAIJGetCSRAndMemType(A, NULL, NULL, &Aa, &petscMemtype)); 22299371c9d4SSatish Balay PetscAssert((PetscMemTypeHost(petscMemtype) && hypreMemtype == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(petscMemtype) && hypreMemtype == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch"); 22305fbaff96SJunchao Zhang 22315fbaff96SJunchao Zhang hmat->diagJ = hypre_CSRMatrixJ(diag); 2232e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(diag), hypreMemtype)); 22335fbaff96SJunchao Zhang hypre_CSRMatrixData(diag) = (HYPRE_Complex *)Aa; 22345fbaff96SJunchao Zhang hypre_CSRMatrixOwnsData(diag) = 0; /* Take ownership of (j,a) away from hypre. As a result, we need to free them on our own */ 22355fbaff96SJunchao Zhang 22365fbaff96SJunchao Zhang /* Copy diagonal pointers of A to device to facilitate MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos */ 22375fbaff96SJunchao Zhang if (hypreMemtype == HYPRE_MEMORY_DEVICE) { 2238e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TAlloc", hmat->diag = hypre_TAlloc(PetscInt, rmap->n, hypreMemtype)); 22395fbaff96SJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); /* We need updated diagonal positions */ 2240e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TMemcpy", hypre_TMemcpy(hmat->diag, ((Mat_SeqAIJ *)A->data)->diag, PetscInt, rmap->n, hypreMemtype, HYPRE_MEMORY_HOST)); 22415fbaff96SJunchao Zhang } 22425fbaff96SJunchao Zhang 22435fbaff96SJunchao Zhang if (size > 1) { 22445fbaff96SJunchao Zhang B = ((Mat_MPIAIJ *)cooMat->data)->B; 22455fbaff96SJunchao Zhang PetscCall(MatSeqAIJGetCSRAndMemType(B, NULL, NULL, &Ba, &petscMemtype)); 22465fbaff96SJunchao Zhang hmat->offdJ = hypre_CSRMatrixJ(offd); 2247e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(offd), hypreMemtype)); 22485fbaff96SJunchao Zhang hypre_CSRMatrixData(offd) = (HYPRE_Complex *)Ba; 22495fbaff96SJunchao Zhang hypre_CSRMatrixOwnsData(offd) = 0; 22505fbaff96SJunchao Zhang } 22515fbaff96SJunchao Zhang 22525fbaff96SJunchao Zhang /* Record cooMat for use in MatSetValuesCOO_HYPRE */ 22535fbaff96SJunchao Zhang hmat->cooMat = cooMat; 22545fbaff96SJunchao Zhang hmat->memType = hypreMemtype; 22553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22565fbaff96SJunchao Zhang } 22575fbaff96SJunchao Zhang 2258d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_HYPRE(Mat mat, const PetscScalar v[], InsertMode imode) 2259d71ae5a4SJacob Faibussowitsch { 22605fbaff96SJunchao Zhang Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data; 22615fbaff96SJunchao Zhang PetscMPIInt size; 22625fbaff96SJunchao Zhang Mat A; 22635fbaff96SJunchao Zhang 22645fbaff96SJunchao Zhang PetscFunctionBegin; 22655fbaff96SJunchao Zhang PetscCheck(hmat->cooMat, hmat->comm, PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet"); 22665fbaff96SJunchao Zhang PetscCallMPI(MPI_Comm_size(hmat->comm, &size)); 22675fbaff96SJunchao Zhang PetscCall(MatSetValuesCOO(hmat->cooMat, v, imode)); 22685fbaff96SJunchao Zhang 22695fbaff96SJunchao Zhang /* Move diagonal elements of the diagonal block to the front of their row, as needed by ParCSRMatrix. So damn hacky */ 22705fbaff96SJunchao Zhang A = (size == 1) ? hmat->cooMat : ((Mat_MPIAIJ *)hmat->cooMat->data)->A; 22715fbaff96SJunchao Zhang if (hmat->memType == HYPRE_MEMORY_HOST) { 22725fbaff96SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 22735fbaff96SJunchao Zhang PetscInt i, m, *Ai = aij->i, *Adiag = aij->diag; 22745fbaff96SJunchao Zhang PetscScalar *Aa = aij->a, tmp; 22755fbaff96SJunchao Zhang 22765fbaff96SJunchao Zhang PetscCall(MatGetSize(A, &m, NULL)); 22775fbaff96SJunchao Zhang for (i = 0; i < m; i++) { 22785fbaff96SJunchao Zhang if (Adiag[i] >= Ai[i] && Adiag[i] < Ai[i + 1]) { /* Digonal element of this row exists in a[] and j[] */ 22795fbaff96SJunchao Zhang tmp = Aa[Ai[i]]; 22805fbaff96SJunchao Zhang Aa[Ai[i]] = Aa[Adiag[i]]; 22815fbaff96SJunchao Zhang Aa[Adiag[i]] = tmp; 22825fbaff96SJunchao Zhang } 22835fbaff96SJunchao Zhang } 22845fbaff96SJunchao Zhang } else { 22855fbaff96SJunchao Zhang #if defined(PETSC_HAVE_KOKKOS_KERNELS) 22865fbaff96SJunchao Zhang PetscCall(MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos(A, hmat->diag)); 22875fbaff96SJunchao Zhang #endif 22885fbaff96SJunchao Zhang } 22893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22905fbaff96SJunchao Zhang } 22915fbaff96SJunchao Zhang 2292a055b5aaSBarry Smith /*MC 22932ef1f0ffSBarry Smith MATHYPRE - "hypre" - A matrix type to be used for sequential and parallel sparse matrices 2294a055b5aaSBarry Smith based on the hypre IJ interface. 2295a055b5aaSBarry Smith 2296a055b5aaSBarry Smith Level: intermediate 2297a055b5aaSBarry Smith 2298*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatHYPRESetPreallocation` 2299a055b5aaSBarry Smith M*/ 2300a055b5aaSBarry Smith 2301d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B) 2302d71ae5a4SJacob Faibussowitsch { 230363c07aadSStefano Zampini Mat_HYPRE *hB; 230463c07aadSStefano Zampini 230563c07aadSStefano Zampini PetscFunctionBegin; 23064dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&hB)); 23076ea7df73SStefano Zampini 2308978814f1SStefano Zampini hB->inner_free = PETSC_TRUE; 2309c69f721fSFande Kong hB->available = PETSC_TRUE; 2310336664bdSPierre Jolivet hB->sorted_full = PETSC_FALSE; /* no assumption whether column indices are sorted or not */ 2311c69f721fSFande Kong hB->size = 0; 2312c69f721fSFande Kong hB->array = NULL; 2313978814f1SStefano Zampini 231463c07aadSStefano Zampini B->data = (void *)hB; 231563c07aadSStefano Zampini B->assembled = PETSC_FALSE; 231663c07aadSStefano Zampini 23179566063dSJacob Faibussowitsch PetscCall(PetscMemzero(B->ops, sizeof(struct _MatOps))); 231863c07aadSStefano Zampini B->ops->mult = MatMult_HYPRE; 231963c07aadSStefano Zampini B->ops->multtranspose = MatMultTranspose_HYPRE; 2320414bd5c3SStefano Zampini B->ops->multadd = MatMultAdd_HYPRE; 2321414bd5c3SStefano Zampini B->ops->multtransposeadd = MatMultTransposeAdd_HYPRE; 232263c07aadSStefano Zampini B->ops->setup = MatSetUp_HYPRE; 232363c07aadSStefano Zampini B->ops->destroy = MatDestroy_HYPRE; 232463c07aadSStefano Zampini B->ops->assemblyend = MatAssemblyEnd_HYPRE; 2325c69f721fSFande Kong B->ops->assemblybegin = MatAssemblyBegin_HYPRE; 2326d975228cSstefano_zampini B->ops->setvalues = MatSetValues_HYPRE; 232768ec7858SStefano Zampini B->ops->missingdiagonal = MatMissingDiagonal_HYPRE; 232868ec7858SStefano Zampini B->ops->scale = MatScale_HYPRE; 232968ec7858SStefano Zampini B->ops->zerorowscolumns = MatZeroRowsColumns_HYPRE; 2330c69f721fSFande Kong B->ops->zeroentries = MatZeroEntries_HYPRE; 2331c69f721fSFande Kong B->ops->zerorows = MatZeroRows_HYPRE; 2332c69f721fSFande Kong B->ops->getrow = MatGetRow_HYPRE; 2333c69f721fSFande Kong B->ops->restorerow = MatRestoreRow_HYPRE; 2334c69f721fSFande Kong B->ops->getvalues = MatGetValues_HYPRE; 2335ddbeb582SStefano Zampini B->ops->setoption = MatSetOption_HYPRE; 233645b8d346SStefano Zampini B->ops->duplicate = MatDuplicate_HYPRE; 2337465edc17SStefano Zampini B->ops->copy = MatCopy_HYPRE; 233845b8d346SStefano Zampini B->ops->view = MatView_HYPRE; 23396305df00SStefano Zampini B->ops->getdiagonal = MatGetDiagonal_HYPRE; 2340363d496dSStefano Zampini B->ops->axpy = MatAXPY_HYPRE; 23414222ddf1SHong Zhang B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE; 23426ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 23436ea7df73SStefano Zampini B->ops->bindtocpu = MatBindToCPU_HYPRE; 23446ea7df73SStefano Zampini B->boundtocpu = PETSC_FALSE; 23456ea7df73SStefano Zampini #endif 234645b8d346SStefano Zampini 234745b8d346SStefano Zampini /* build cache for off array entries formed */ 23489566063dSJacob Faibussowitsch PetscCall(MatStashCreate_Private(PetscObjectComm((PetscObject)B), 1, &B->stash)); 234963c07aadSStefano Zampini 23509566063dSJacob Faibussowitsch PetscCall(PetscCommGetComm(PetscObjectComm((PetscObject)B), &hB->comm)); 23519566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATHYPRE)); 23529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_aij_C", MatConvert_HYPRE_AIJ)); 23539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_is_C", MatConvert_HYPRE_IS)); 23549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_hypre_C", MatProductSetFromOptions_HYPRE)); 23559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaij_hypre_C", MatProductSetFromOptions_HYPRE)); 23569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPRESetPreallocation_C", MatHYPRESetPreallocation_HYPRE)); 23579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPREGetParCSR_C", MatHYPREGetParCSR_HYPRE)); 23585fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_HYPRE)); 23595fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_HYPRE)); 23606ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 23616ea7df73SStefano Zampini #if defined(HYPRE_USING_HIP) 23629566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_HIP)); 23639566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B, VECHIP)); 23646ea7df73SStefano Zampini #endif 23656ea7df73SStefano Zampini #if defined(HYPRE_USING_CUDA) 23669566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_CUDA)); 23679566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B, VECCUDA)); 23686ea7df73SStefano Zampini #endif 23696ea7df73SStefano Zampini #endif 23703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 237163c07aadSStefano Zampini } 237263c07aadSStefano Zampini 2373d71ae5a4SJacob Faibussowitsch static PetscErrorCode hypre_array_destroy(void *ptr) 2374d71ae5a4SJacob Faibussowitsch { 2375225daaf8SStefano Zampini PetscFunctionBegin; 2376e6de0934SSatish Balay hypre_TFree(ptr, HYPRE_MEMORY_HOST); 23773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2378225daaf8SStefano Zampini } 2379