163c07aadSStefano Zampini 263c07aadSStefano Zampini /* 363c07aadSStefano Zampini Creates hypre ijmatrix from PETSc matrix 463c07aadSStefano Zampini */ 5225daaf8SStefano Zampini 6c6698e78SStefano Zampini #include <petscpkg_version.h> 739accc25SStefano Zampini #include <petsc/private/petschypre.h> 8dd9c0a25Sstefano_zampini #include <petscmathypre.h> 963c07aadSStefano Zampini #include <petsc/private/matimpl.h> 10a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h> 1163c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h> 1263c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h> 1358968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h> 1458968eb6SStefano Zampini #include <HYPRE.h> 15c1a070e6SStefano Zampini #include <HYPRE_utilities.h> 16cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h> 1768ec7858SStefano Zampini #include <_hypre_sstruct_ls.h> 1863c07aadSStefano Zampini 190e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 200e6427aaSSatish Balay #define hypre_ParCSRMatrixClone(A, B) hypre_ParCSRMatrixCompleteClone(A) 210e6427aaSSatish Balay #endif 220e6427aaSSatish Balay 2363c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat, Mat_HYPRE *); 2463c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat, Mat, HYPRE_IJMatrix); 2563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat, HYPRE_IJMatrix); 2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat, HYPRE_IJMatrix); 2739accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat, HYPRE_Complex, Vec, HYPRE_Complex, Vec, PetscBool); 28225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void *); 296ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[], const PetscScalar[], InsertMode ins); 3063c07aadSStefano Zampini 31d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij) 32d71ae5a4SJacob Faibussowitsch { 3363c07aadSStefano Zampini PetscInt i, n_d, n_o; 3463c07aadSStefano Zampini const PetscInt *ia_d, *ia_o; 3563c07aadSStefano Zampini PetscBool done_d = PETSC_FALSE, done_o = PETSC_FALSE; 362cf14000SStefano Zampini HYPRE_Int *nnz_d = NULL, *nnz_o = NULL; 3763c07aadSStefano Zampini 3863c07aadSStefano Zampini PetscFunctionBegin; 3963c07aadSStefano Zampini if (A_d) { /* determine number of nonzero entries in local diagonal part */ 409566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, &n_d, &ia_d, NULL, &done_d)); 4163c07aadSStefano Zampini if (done_d) { 429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_d, &nnz_d)); 43ad540459SPierre Jolivet for (i = 0; i < n_d; i++) nnz_d[i] = ia_d[i + 1] - ia_d[i]; 4463c07aadSStefano Zampini } 459566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, NULL, &ia_d, NULL, &done_d)); 4663c07aadSStefano Zampini } 4763c07aadSStefano Zampini if (A_o) { /* determine number of nonzero entries in local off-diagonal part */ 489566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o)); 4963c07aadSStefano Zampini if (done_o) { 509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_o, &nnz_o)); 51ad540459SPierre Jolivet for (i = 0; i < n_o; i++) nnz_o[i] = ia_o[i + 1] - ia_o[i]; 5263c07aadSStefano Zampini } 539566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o)); 5463c07aadSStefano Zampini } 5563c07aadSStefano Zampini if (done_d) { /* set number of nonzeros in HYPRE IJ matrix */ 5663c07aadSStefano Zampini if (!done_o) { /* only diagonal part */ 579566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n_d, &nnz_o)); 5863c07aadSStefano Zampini } 59c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 60c6698e78SStefano Zampini { /* If we don't do this, the columns of the matrix will be all zeros! */ 61c6698e78SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 62c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 63c6698e78SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 64c6698e78SStefano Zampini hypre_IJMatrixTranslator(ij) = NULL; 65792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, ij, nnz_d, nnz_o); 6622235d61SPierre Jolivet /* it seems they partially fixed it in 2.19.0 */ 6722235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 68c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 69c6698e78SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; 7022235d61SPierre Jolivet #endif 71c6698e78SStefano Zampini } 72c6698e78SStefano Zampini #else 73792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, ij, nnz_d, nnz_o); 74c6698e78SStefano Zampini #endif 759566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_d)); 769566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_o)); 7763c07aadSStefano Zampini } 783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7963c07aadSStefano Zampini } 8063c07aadSStefano Zampini 81d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA) 82d71ae5a4SJacob Faibussowitsch { 8363c07aadSStefano Zampini PetscInt rstart, rend, cstart, cend; 8463c07aadSStefano Zampini 8563c07aadSStefano Zampini PetscFunctionBegin; 869566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 879566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 8863c07aadSStefano Zampini rstart = A->rmap->rstart; 8963c07aadSStefano Zampini rend = A->rmap->rend; 9063c07aadSStefano Zampini cstart = A->cmap->rstart; 9163c07aadSStefano Zampini cend = A->cmap->rend; 92*ea9ee2c1SPierre Jolivet PetscHYPREInitialize(); 93792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij); 94792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR); 9563c07aadSStefano Zampini { 9663c07aadSStefano Zampini PetscBool same; 9763c07aadSStefano Zampini Mat A_d, A_o; 9863c07aadSStefano Zampini const PetscInt *colmap; 999566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &same)); 10063c07aadSStefano Zampini if (same) { 1019566063dSJacob Faibussowitsch PetscCall(MatMPIAIJGetSeqAIJ(A, &A_d, &A_o, &colmap)); 1029566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij)); 1033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10463c07aadSStefano Zampini } 1059566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIBAIJ, &same)); 10663c07aadSStefano Zampini if (same) { 1079566063dSJacob Faibussowitsch PetscCall(MatMPIBAIJGetSeqBAIJ(A, &A_d, &A_o, &colmap)); 1089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij)); 1093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11063c07aadSStefano Zampini } 1119566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &same)); 11263c07aadSStefano Zampini if (same) { 1139566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij)); 1143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11563c07aadSStefano Zampini } 1169566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQBAIJ, &same)); 11763c07aadSStefano Zampini if (same) { 1189566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij)); 1193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12063c07aadSStefano Zampini } 12163c07aadSStefano Zampini } 1223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12363c07aadSStefano Zampini } 12463c07aadSStefano Zampini 125d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixCopy(Mat A, HYPRE_IJMatrix ij) 126d71ae5a4SJacob Faibussowitsch { 12763c07aadSStefano Zampini PetscInt i, rstart, rend, ncols, nr, nc; 12863c07aadSStefano Zampini const PetscScalar *values; 12963c07aadSStefano Zampini const PetscInt *cols; 13063c07aadSStefano Zampini PetscBool flg; 13163c07aadSStefano Zampini 13263c07aadSStefano Zampini PetscFunctionBegin; 1336ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 134792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize, ij); 1356ea7df73SStefano Zampini #else 136792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize_v2, ij, HYPRE_MEMORY_HOST); 1376ea7df73SStefano Zampini #endif 1389566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &flg)); 1399566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &nr, &nc)); 14063c07aadSStefano Zampini if (flg && nr == nc) { 1419566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixFastCopy_MPIAIJ(A, ij)); 1423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14363c07aadSStefano Zampini } 1449566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &flg)); 14563c07aadSStefano Zampini if (flg) { 1469566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixFastCopy_SeqAIJ(A, ij)); 1473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14863c07aadSStefano Zampini } 14963c07aadSStefano Zampini 1505fbaff96SJunchao Zhang /* Do not need Aux since we have done precise i[],j[] allocation in MatHYPRE_CreateFromMat() */ 1515fbaff96SJunchao Zhang hypre_AuxParCSRMatrixNeedAux((hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij)) = 0; 1525fbaff96SJunchao Zhang 1539566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rstart, &rend)); 15463c07aadSStefano Zampini for (i = rstart; i < rend; i++) { 1559566063dSJacob Faibussowitsch PetscCall(MatGetRow(A, i, &ncols, &cols, &values)); 156e3977e59Sstefano_zampini if (ncols) { 1572cf14000SStefano Zampini HYPRE_Int nc = (HYPRE_Int)ncols; 1582cf14000SStefano Zampini 159aed4548fSBarry Smith PetscCheck((PetscInt)nc == ncols, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, ncols, i); 160792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetValues, ij, 1, &nc, (HYPRE_BigInt *)&i, (HYPRE_BigInt *)cols, (HYPRE_Complex *)values); 161e3977e59Sstefano_zampini } 1629566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(A, i, &ncols, &cols, &values)); 16363c07aadSStefano Zampini } 1643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16563c07aadSStefano Zampini } 16663c07aadSStefano Zampini 167d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat A, HYPRE_IJMatrix ij) 168d71ae5a4SJacob Faibussowitsch { 16963c07aadSStefano Zampini Mat_SeqAIJ *pdiag = (Mat_SeqAIJ *)A->data; 17058968eb6SStefano Zampini HYPRE_Int type; 17163c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 17263c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 17363c07aadSStefano Zampini hypre_CSRMatrix *hdiag; 1742cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 1756ea7df73SStefano Zampini const PetscScalar *pa; 17663c07aadSStefano Zampini 17763c07aadSStefano Zampini PetscFunctionBegin; 178792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, ij, &type); 17908401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 180792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, ij, (void **)&par_matrix); 18163c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 18263c07aadSStefano Zampini /* 18363c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 18463c07aadSStefano Zampini */ 1852cf14000SStefano Zampini if (sameint) { 1869566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i, pdiag->i, A->rmap->n + 1)); 1879566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->j, pdiag->j, pdiag->nz)); 1882cf14000SStefano Zampini } else { 1892cf14000SStefano Zampini PetscInt i; 1902cf14000SStefano Zampini 1912cf14000SStefano Zampini for (i = 0; i < A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i]; 1922cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hdiag->j[i] = (HYPRE_Int)pdiag->j[i]; 1932cf14000SStefano Zampini } 1946ea7df73SStefano Zampini 1959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &pa)); 1969566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->data, pa, pdiag->nz)); 1979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &pa)); 198ea9daf28SStefano Zampini 199ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 20063c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 2013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20263c07aadSStefano Zampini } 20363c07aadSStefano Zampini 204d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat A, HYPRE_IJMatrix ij) 205d71ae5a4SJacob Faibussowitsch { 20663c07aadSStefano Zampini Mat_MPIAIJ *pA = (Mat_MPIAIJ *)A->data; 20763c07aadSStefano Zampini Mat_SeqAIJ *pdiag, *poffd; 20863c07aadSStefano Zampini PetscInt i, *garray = pA->garray, *jj, cstart, *pjj; 2092cf14000SStefano Zampini HYPRE_Int *hjj, type; 21063c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 21163c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 21263c07aadSStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 2132cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 2146ea7df73SStefano Zampini const PetscScalar *pa; 21563c07aadSStefano Zampini 21663c07aadSStefano Zampini PetscFunctionBegin; 21763c07aadSStefano Zampini pdiag = (Mat_SeqAIJ *)pA->A->data; 21863c07aadSStefano Zampini poffd = (Mat_SeqAIJ *)pA->B->data; 219da81f932SPierre Jolivet /* cstart is only valid for square MPIAIJ laid out in the usual way */ 2209566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &cstart, NULL)); 22163c07aadSStefano Zampini 222792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, ij, &type); 22308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 224792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, ij, (void **)&par_matrix); 22563c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 22663c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(par_matrix); 22763c07aadSStefano Zampini 22863c07aadSStefano Zampini /* 22963c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 23063c07aadSStefano Zampini */ 2312cf14000SStefano Zampini if (sameint) { 2329566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i, pdiag->i, pA->A->rmap->n + 1)); 2332cf14000SStefano Zampini } else { 2342cf14000SStefano Zampini for (i = 0; i < pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)(pdiag->i[i]); 2352cf14000SStefano Zampini } 23663c07aadSStefano Zampini /* need to shift the diag column indices (hdiag->j) back to global numbering since hypre is expecting this */ 2372cf14000SStefano Zampini hjj = hdiag->j; 2382cf14000SStefano Zampini pjj = pdiag->j; 239c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 2402cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hjj[i] = pjj[i]; 241c6698e78SStefano Zampini #else 2422cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hjj[i] = cstart + pjj[i]; 243c6698e78SStefano Zampini #endif 2449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(pA->A, &pa)); 2459566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->data, pa, pdiag->nz)); 2469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(pA->A, &pa)); 2472cf14000SStefano Zampini if (sameint) { 2489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hoffd->i, poffd->i, pA->A->rmap->n + 1)); 2492cf14000SStefano Zampini } else { 2502cf14000SStefano Zampini for (i = 0; i < pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)(poffd->i[i]); 2512cf14000SStefano Zampini } 2522cf14000SStefano Zampini 25363c07aadSStefano Zampini /* need to move the offd column indices (hoffd->j) back to global numbering since hypre is expecting this 25463c07aadSStefano Zampini If we hacked a hypre a bit more we might be able to avoid this step */ 255c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0) 256792fecdfSBarry Smith PetscCallExternal(hypre_CSRMatrixBigInitialize, hoffd); 257c6698e78SStefano Zampini jj = (PetscInt *)hoffd->big_j; 258c6698e78SStefano Zampini #else 25963c07aadSStefano Zampini jj = (PetscInt *)hoffd->j; 260c6698e78SStefano Zampini #endif 2612cf14000SStefano Zampini pjj = poffd->j; 26263c07aadSStefano Zampini for (i = 0; i < poffd->nz; i++) jj[i] = garray[pjj[i]]; 263c6698e78SStefano Zampini 2649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(pA->B, &pa)); 2659566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hoffd->data, pa, poffd->nz)); 2669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(pA->B, &pa)); 26763c07aadSStefano Zampini 268ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij); 26963c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 2703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 27163c07aadSStefano Zampini } 27263c07aadSStefano Zampini 273d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat *B) 274d71ae5a4SJacob Faibussowitsch { 2752df22349SStefano Zampini Mat_HYPRE *mhA = (Mat_HYPRE *)(A->data); 2762df22349SStefano Zampini Mat lA; 2772df22349SStefano Zampini ISLocalToGlobalMapping rl2g, cl2g; 2782df22349SStefano Zampini IS is; 2792df22349SStefano Zampini hypre_ParCSRMatrix *hA; 2802df22349SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 2812df22349SStefano Zampini MPI_Comm comm; 28239accc25SStefano Zampini HYPRE_Complex *hdd, *hod, *aa; 28339accc25SStefano Zampini PetscScalar *data; 2842cf14000SStefano Zampini HYPRE_BigInt *col_map_offd; 2852cf14000SStefano Zampini HYPRE_Int *hdi, *hdj, *hoi, *hoj; 2862df22349SStefano Zampini PetscInt *ii, *jj, *iptr, *jptr; 2872df22349SStefano Zampini PetscInt cum, dr, dc, oc, str, stc, nnz, i, jd, jo, M, N; 28858968eb6SStefano Zampini HYPRE_Int type; 2892df22349SStefano Zampini 2902df22349SStefano Zampini PetscFunctionBegin; 291a1787963SStefano Zampini comm = PetscObjectComm((PetscObject)A); 292792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, mhA->ij, &type); 29308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 294792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, mhA->ij, (void **)&hA); 2952df22349SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(hA); 2962df22349SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(hA); 2972df22349SStefano Zampini str = hypre_ParCSRMatrixFirstRowIndex(hA); 2982df22349SStefano Zampini stc = hypre_ParCSRMatrixFirstColDiag(hA); 2992df22349SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(hA); 3002df22349SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(hA); 3012df22349SStefano Zampini dr = hypre_CSRMatrixNumRows(hdiag); 3022df22349SStefano Zampini dc = hypre_CSRMatrixNumCols(hdiag); 3032df22349SStefano Zampini nnz = hypre_CSRMatrixNumNonzeros(hdiag); 3042df22349SStefano Zampini hdi = hypre_CSRMatrixI(hdiag); 3052df22349SStefano Zampini hdj = hypre_CSRMatrixJ(hdiag); 3062df22349SStefano Zampini hdd = hypre_CSRMatrixData(hdiag); 3072df22349SStefano Zampini oc = hypre_CSRMatrixNumCols(hoffd); 3082df22349SStefano Zampini nnz += hypre_CSRMatrixNumNonzeros(hoffd); 3092df22349SStefano Zampini hoi = hypre_CSRMatrixI(hoffd); 3102df22349SStefano Zampini hoj = hypre_CSRMatrixJ(hoffd); 3112df22349SStefano Zampini hod = hypre_CSRMatrixData(hoffd); 3122df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 3132df22349SStefano Zampini PetscInt *aux; 3142df22349SStefano Zampini 3152df22349SStefano Zampini /* generate l2g maps for rows and cols */ 3169566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, dr, str, 1, &is)); 3179566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is, &rl2g)); 3189566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 3192df22349SStefano Zampini col_map_offd = hypre_ParCSRMatrixColMapOffd(hA); 3209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dc + oc, &aux)); 3212df22349SStefano Zampini for (i = 0; i < dc; i++) aux[i] = i + stc; 3222df22349SStefano Zampini for (i = 0; i < oc; i++) aux[i + dc] = col_map_offd[i]; 3239566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(comm, dc + oc, aux, PETSC_OWN_POINTER, &is)); 3249566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is, &cl2g)); 3259566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 3262df22349SStefano Zampini /* create MATIS object */ 3279566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, B)); 3289566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, dr, dc, M, N)); 3299566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATIS)); 3309566063dSJacob Faibussowitsch PetscCall(MatSetLocalToGlobalMapping(*B, rl2g, cl2g)); 3319566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&rl2g)); 3329566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&cl2g)); 3332df22349SStefano Zampini 3342df22349SStefano Zampini /* allocate CSR for local matrix */ 3359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dr + 1, &iptr)); 3369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &jptr)); 3379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &data)); 3382df22349SStefano Zampini } else { 3392df22349SStefano Zampini PetscInt nr; 3402df22349SStefano Zampini PetscBool done; 3419566063dSJacob Faibussowitsch PetscCall(MatISGetLocalMat(*B, &lA)); 3429566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(lA, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&iptr, (const PetscInt **)&jptr, &done)); 34308401ef6SPierre Jolivet PetscCheck(nr == dr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT, nr, dr); 34408401ef6SPierre Jolivet PetscCheck(iptr[nr] >= nnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in local mat! reuse %" PetscInt_FMT " requested %" PetscInt_FMT, iptr[nr], nnz); 3459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(lA, &data)); 3462df22349SStefano Zampini } 3472df22349SStefano Zampini /* merge local matrices */ 3482df22349SStefano Zampini ii = iptr; 3492df22349SStefano Zampini jj = jptr; 35039accc25SStefano Zampini aa = (HYPRE_Complex *)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 3512df22349SStefano Zampini *ii = *(hdi++) + *(hoi++); 3522df22349SStefano Zampini for (jd = 0, jo = 0, cum = 0; *ii < nnz; cum++) { 35339accc25SStefano Zampini PetscScalar *aold = (PetscScalar *)aa; 3542df22349SStefano Zampini PetscInt *jold = jj, nc = jd + jo; 3559371c9d4SSatish Balay for (; jd < *hdi; jd++) { 3569371c9d4SSatish Balay *jj++ = *hdj++; 3579371c9d4SSatish Balay *aa++ = *hdd++; 3589371c9d4SSatish Balay } 3599371c9d4SSatish Balay for (; jo < *hoi; jo++) { 3609371c9d4SSatish Balay *jj++ = *hoj++ + dc; 3619371c9d4SSatish Balay *aa++ = *hod++; 3629371c9d4SSatish Balay } 3632df22349SStefano Zampini *(++ii) = *(hdi++) + *(hoi++); 3649566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(jd + jo - nc, jold, aold)); 3652df22349SStefano Zampini } 3662df22349SStefano Zampini for (; cum < dr; cum++) *(++ii) = nnz; 3672df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 368a033916dSStefano Zampini Mat_SeqAIJ *a; 369a033916dSStefano Zampini 3709566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF, dr, dc + oc, iptr, jptr, data, &lA)); 3719566063dSJacob Faibussowitsch PetscCall(MatISSetLocalMat(*B, lA)); 372a033916dSStefano Zampini /* hack SeqAIJ */ 373a033916dSStefano Zampini a = (Mat_SeqAIJ *)(lA->data); 374a033916dSStefano Zampini a->free_a = PETSC_TRUE; 375a033916dSStefano Zampini a->free_ij = PETSC_TRUE; 3769566063dSJacob Faibussowitsch PetscCall(MatDestroy(&lA)); 3772df22349SStefano Zampini } 3789566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 3799566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 38048a46eb9SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, B)); 3813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3822df22349SStefano Zampini } 3832df22349SStefano Zampini 384d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B) 385d71ae5a4SJacob Faibussowitsch { 38684d4e069SStefano Zampini Mat M = NULL; 38763c07aadSStefano Zampini Mat_HYPRE *hB; 38863c07aadSStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 38963c07aadSStefano Zampini 39063c07aadSStefano Zampini PetscFunctionBegin; 39163c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 39263c07aadSStefano Zampini /* always destroy the old matrix and create a new memory; 39363c07aadSStefano Zampini hope this does not churn the memory too much. The problem 39463c07aadSStefano Zampini is I do not know if it is possible to put the matrix back to 39563c07aadSStefano Zampini its initial state so that we can directly copy the values 39663c07aadSStefano Zampini the second time through. */ 39763c07aadSStefano Zampini hB = (Mat_HYPRE *)((*B)->data); 398792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixDestroy, hB->ij); 39963c07aadSStefano Zampini } else { 4009566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &M)); 4019566063dSJacob Faibussowitsch PetscCall(MatSetType(M, MATHYPRE)); 4029566063dSJacob Faibussowitsch PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N)); 40384d4e069SStefano Zampini hB = (Mat_HYPRE *)(M->data); 40484d4e069SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) *B = M; 40563c07aadSStefano Zampini } 4069566063dSJacob Faibussowitsch PetscCall(MatSetOption(*B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 4079566063dSJacob Faibussowitsch PetscCall(MatSetOption(*B, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 4089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_CreateFromMat(A, hB)); 4099566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixCopy(A, hB->ij)); 41048a46eb9SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M)); 4114ec6421dSstefano_zampini (*B)->preallocated = PETSC_TRUE; 4129566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 4139566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 4143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 41563c07aadSStefano Zampini } 41663c07aadSStefano Zampini 417d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B) 418d71ae5a4SJacob Faibussowitsch { 41963c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 42063c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 42163c07aadSStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 42263c07aadSStefano Zampini MPI_Comm comm; 42363c07aadSStefano Zampini PetscScalar *da, *oa, *aptr; 42463c07aadSStefano Zampini PetscInt *dii, *djj, *oii, *ojj, *iptr; 42563c07aadSStefano Zampini PetscInt i, dnnz, onnz, m, n; 42658968eb6SStefano Zampini HYPRE_Int type; 42763c07aadSStefano Zampini PetscMPIInt size; 4282cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 42963c07aadSStefano Zampini 43063c07aadSStefano Zampini PetscFunctionBegin; 43163c07aadSStefano Zampini comm = PetscObjectComm((PetscObject)A); 432792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type); 43308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 43463c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 43563c07aadSStefano Zampini PetscBool ismpiaij, isseqaij; 4369566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATMPIAIJ, &ismpiaij)); 4379566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATSEQAIJ, &isseqaij)); 43808401ef6SPierre Jolivet PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Only MATMPIAIJ or MATSEQAIJ are supported"); 43963c07aadSStefano Zampini } 4406ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 44108401ef6SPierre Jolivet PetscCheck(HYPRE_MEMORY_DEVICE != hypre_IJMatrixMemoryLocation(hA->ij), comm, PETSC_ERR_SUP, "Not yet implemented"); 4426ea7df73SStefano Zampini #endif 4439566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 44463c07aadSStefano Zampini 445792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr); 44663c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 44763c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 44863c07aadSStefano Zampini m = hypre_CSRMatrixNumRows(hdiag); 44963c07aadSStefano Zampini n = hypre_CSRMatrixNumCols(hdiag); 45063c07aadSStefano Zampini dnnz = hypre_CSRMatrixNumNonzeros(hdiag); 45163c07aadSStefano Zampini onnz = hypre_CSRMatrixNumNonzeros(hoffd); 452225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 4539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &dii)); 4549566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz, &djj)); 4559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz, &da)); 456225daaf8SStefano Zampini } else if (reuse == MAT_REUSE_MATRIX) { 45763c07aadSStefano Zampini PetscInt nr; 45863c07aadSStefano Zampini PetscBool done; 45963c07aadSStefano Zampini if (size > 1) { 46063c07aadSStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data); 46163c07aadSStefano Zampini 4629566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(b->A, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&dii, (const PetscInt **)&djj, &done)); 46308401ef6SPierre Jolivet PetscCheck(nr == m, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows in diag part! %" PetscInt_FMT " != %" PetscInt_FMT, nr, m); 46408401ef6SPierre Jolivet PetscCheck(dii[nr] >= dnnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in diag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, dii[nr], dnnz); 4659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(b->A, &da)); 46663c07aadSStefano Zampini } else { 4679566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(*B, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&dii, (const PetscInt **)&djj, &done)); 46808401ef6SPierre Jolivet PetscCheck(nr == m, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows! %" PetscInt_FMT " != %" PetscInt_FMT, nr, m); 46908401ef6SPierre Jolivet PetscCheck(dii[nr] >= dnnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, dii[nr], dnnz); 4709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*B, &da)); 47163c07aadSStefano Zampini } 472225daaf8SStefano Zampini } else { /* MAT_INPLACE_MATRIX */ 4732cf14000SStefano Zampini if (!sameint) { 4749566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &dii)); 4759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz, &djj)); 4762cf14000SStefano Zampini } else { 4777d968826Sstefano_zampini dii = (PetscInt *)hypre_CSRMatrixI(hdiag); 4787d968826Sstefano_zampini djj = (PetscInt *)hypre_CSRMatrixJ(hdiag); 47963c07aadSStefano Zampini } 48039accc25SStefano Zampini da = (PetscScalar *)hypre_CSRMatrixData(hdiag); 48163c07aadSStefano Zampini } 4822cf14000SStefano Zampini 4832cf14000SStefano Zampini if (!sameint) { 4849371c9d4SSatish Balay if (reuse != MAT_REUSE_MATRIX) { 4859371c9d4SSatish Balay for (i = 0; i < m + 1; i++) dii[i] = (PetscInt)(hypre_CSRMatrixI(hdiag)[i]); 4869371c9d4SSatish Balay } 4872cf14000SStefano Zampini for (i = 0; i < dnnz; i++) djj[i] = (PetscInt)(hypre_CSRMatrixJ(hdiag)[i]); 4882cf14000SStefano Zampini } else { 4899566063dSJacob Faibussowitsch if (reuse != MAT_REUSE_MATRIX) PetscCall(PetscArraycpy(dii, hypre_CSRMatrixI(hdiag), m + 1)); 4909566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(djj, hypre_CSRMatrixJ(hdiag), dnnz)); 4912cf14000SStefano Zampini } 4929566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(da, hypre_CSRMatrixData(hdiag), dnnz)); 49363c07aadSStefano Zampini iptr = djj; 49463c07aadSStefano Zampini aptr = da; 49563c07aadSStefano Zampini for (i = 0; i < m; i++) { 49663c07aadSStefano Zampini PetscInt nc = dii[i + 1] - dii[i]; 4979566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(nc, iptr, aptr)); 49863c07aadSStefano Zampini iptr += nc; 49963c07aadSStefano Zampini aptr += nc; 50063c07aadSStefano Zampini } 50163c07aadSStefano Zampini if (size > 1) { 5022cf14000SStefano Zampini HYPRE_BigInt *coffd; 5032cf14000SStefano Zampini HYPRE_Int *offdj; 50463c07aadSStefano Zampini 505225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 5069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &oii)); 5079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz, &ojj)); 5089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz, &oa)); 509225daaf8SStefano Zampini } else if (reuse == MAT_REUSE_MATRIX) { 51063c07aadSStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data); 51163c07aadSStefano Zampini PetscInt nr, hr = hypre_CSRMatrixNumRows(hoffd); 51263c07aadSStefano Zampini PetscBool done; 51363c07aadSStefano Zampini 5149566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(b->B, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&oii, (const PetscInt **)&ojj, &done)); 51508401ef6SPierre Jolivet PetscCheck(nr == hr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of local rows in offdiag part! %" PetscInt_FMT " != %" PetscInt_FMT, nr, hr); 51608401ef6SPierre Jolivet PetscCheck(oii[nr] >= onnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in offdiag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT, oii[nr], onnz); 5179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(b->B, &oa)); 518225daaf8SStefano Zampini } else { /* MAT_INPLACE_MATRIX */ 5192cf14000SStefano Zampini if (!sameint) { 5209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &oii)); 5219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz, &ojj)); 5222cf14000SStefano Zampini } else { 5237d968826Sstefano_zampini oii = (PetscInt *)hypre_CSRMatrixI(hoffd); 5247d968826Sstefano_zampini ojj = (PetscInt *)hypre_CSRMatrixJ(hoffd); 52563c07aadSStefano Zampini } 52639accc25SStefano Zampini oa = (PetscScalar *)hypre_CSRMatrixData(hoffd); 52763c07aadSStefano Zampini } 528a16187a7SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 5292cf14000SStefano Zampini if (!sameint) { 5302cf14000SStefano Zampini for (i = 0; i < m + 1; i++) oii[i] = (PetscInt)(hypre_CSRMatrixI(hoffd)[i]); 5312cf14000SStefano Zampini } else { 5329566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(oii, hypre_CSRMatrixI(hoffd), m + 1)); 5332cf14000SStefano Zampini } 534a16187a7SStefano Zampini } 5359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(oa, hypre_CSRMatrixData(hoffd), onnz)); 536a16187a7SStefano Zampini 53763c07aadSStefano Zampini offdj = hypre_CSRMatrixJ(hoffd); 53863c07aadSStefano Zampini coffd = hypre_ParCSRMatrixColMapOffd(parcsr); 539a16187a7SStefano Zampini /* we only need the permutation to be computed properly, I don't know if HYPRE 540a16187a7SStefano Zampini messes up with the ordering. Just in case, allocate some memory and free it 541a16187a7SStefano Zampini later */ 542a16187a7SStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 543a16187a7SStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ *)((*B)->data); 544a16187a7SStefano Zampini PetscInt mnz; 545a16187a7SStefano Zampini 5469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetMaxRowNonzeros(b->B, &mnz)); 5479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mnz, &ojj)); 5489371c9d4SSatish Balay } else 5499371c9d4SSatish Balay for (i = 0; i < onnz; i++) ojj[i] = coffd[offdj[i]]; 55063c07aadSStefano Zampini iptr = ojj; 55163c07aadSStefano Zampini aptr = oa; 55263c07aadSStefano Zampini for (i = 0; i < m; i++) { 55363c07aadSStefano Zampini PetscInt nc = oii[i + 1] - oii[i]; 554a16187a7SStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 555a16187a7SStefano Zampini PetscInt j; 556a16187a7SStefano Zampini 557a16187a7SStefano Zampini iptr = ojj; 558a16187a7SStefano Zampini for (j = 0; j < nc; j++) iptr[j] = coffd[offdj[oii[i] + j]]; 559a16187a7SStefano Zampini } 5609566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(nc, iptr, aptr)); 56163c07aadSStefano Zampini iptr += nc; 56263c07aadSStefano Zampini aptr += nc; 56363c07aadSStefano Zampini } 5649566063dSJacob Faibussowitsch if (reuse == MAT_REUSE_MATRIX) PetscCall(PetscFree(ojj)); 565225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 56663c07aadSStefano Zampini Mat_MPIAIJ *b; 56763c07aadSStefano Zampini Mat_SeqAIJ *d, *o; 568225daaf8SStefano Zampini 5699566063dSJacob Faibussowitsch PetscCall(MatCreateMPIAIJWithSplitArrays(comm, m, n, PETSC_DECIDE, PETSC_DECIDE, dii, djj, da, oii, ojj, oa, B)); 57063c07aadSStefano Zampini /* hack MPIAIJ */ 57163c07aadSStefano Zampini b = (Mat_MPIAIJ *)((*B)->data); 57263c07aadSStefano Zampini d = (Mat_SeqAIJ *)b->A->data; 57363c07aadSStefano Zampini o = (Mat_SeqAIJ *)b->B->data; 57463c07aadSStefano Zampini d->free_a = PETSC_TRUE; 57563c07aadSStefano Zampini d->free_ij = PETSC_TRUE; 57663c07aadSStefano Zampini o->free_a = PETSC_TRUE; 57763c07aadSStefano Zampini o->free_ij = PETSC_TRUE; 578225daaf8SStefano Zampini } else if (reuse == MAT_INPLACE_MATRIX) { 579225daaf8SStefano Zampini Mat T; 5802cf14000SStefano Zampini 5819566063dSJacob Faibussowitsch PetscCall(MatCreateMPIAIJWithSplitArrays(comm, m, n, PETSC_DECIDE, PETSC_DECIDE, dii, djj, da, oii, ojj, oa, &T)); 5822cf14000SStefano Zampini if (sameint) { /* ownership of CSR pointers is transferred to PETSc */ 583225daaf8SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 584225daaf8SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 585225daaf8SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 586225daaf8SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 5872cf14000SStefano Zampini } else { /* Hack MPIAIJ -> free ij but not a */ 5882cf14000SStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ *)(T->data); 5892cf14000SStefano Zampini Mat_SeqAIJ *d = (Mat_SeqAIJ *)(b->A->data); 5902cf14000SStefano Zampini Mat_SeqAIJ *o = (Mat_SeqAIJ *)(b->B->data); 5912cf14000SStefano Zampini 5922cf14000SStefano Zampini d->free_ij = PETSC_TRUE; 5932cf14000SStefano Zampini o->free_ij = PETSC_TRUE; 5942cf14000SStefano Zampini } 5952cf14000SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 596225daaf8SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 5979566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &T)); 59863c07aadSStefano Zampini } 599225daaf8SStefano Zampini } else { 600225daaf8SStefano Zampini oii = NULL; 601225daaf8SStefano Zampini ojj = NULL; 602225daaf8SStefano Zampini oa = NULL; 603225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 60463c07aadSStefano Zampini Mat_SeqAIJ *b; 6052cf14000SStefano Zampini 6069566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(comm, m, n, dii, djj, da, B)); 60763c07aadSStefano Zampini /* hack SeqAIJ */ 60863c07aadSStefano Zampini b = (Mat_SeqAIJ *)((*B)->data); 60963c07aadSStefano Zampini b->free_a = PETSC_TRUE; 61063c07aadSStefano Zampini b->free_ij = PETSC_TRUE; 611225daaf8SStefano Zampini } else if (reuse == MAT_INPLACE_MATRIX) { 612225daaf8SStefano Zampini Mat T; 6132cf14000SStefano Zampini 6149566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(comm, m, n, dii, djj, da, &T)); 6152cf14000SStefano Zampini if (sameint) { /* ownership of CSR pointers is transferred to PETSc */ 616225daaf8SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 617225daaf8SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 6182cf14000SStefano Zampini } else { /* free ij but not a */ 6192cf14000SStefano Zampini Mat_SeqAIJ *b = (Mat_SeqAIJ *)(T->data); 6202cf14000SStefano Zampini 6212cf14000SStefano Zampini b->free_ij = PETSC_TRUE; 6222cf14000SStefano Zampini } 623225daaf8SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 6249566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &T)); 62563c07aadSStefano Zampini } 626225daaf8SStefano Zampini } 627225daaf8SStefano Zampini 6282cf14000SStefano Zampini /* we have to use hypre_Tfree to free the HYPRE arrays 629da81f932SPierre Jolivet that PETSc now owns */ 63063c07aadSStefano Zampini if (reuse == MAT_INPLACE_MATRIX) { 6312cf14000SStefano Zampini PetscInt nh; 6322cf14000SStefano Zampini void *ptrs[6] = {da, oa, dii, djj, oii, ojj}; 6339371c9d4SSatish Balay const char *names[6] = {"_hypre_csr_da", "_hypre_csr_oa", "_hypre_csr_dii", "_hypre_csr_djj", "_hypre_csr_oii", "_hypre_csr_ojj"}; 6342cf14000SStefano Zampini nh = sameint ? 6 : 2; 6352cf14000SStefano Zampini for (i = 0; i < nh; i++) { 636225daaf8SStefano Zampini PetscContainer c; 637225daaf8SStefano Zampini 6389566063dSJacob Faibussowitsch PetscCall(PetscContainerCreate(comm, &c)); 6399566063dSJacob Faibussowitsch PetscCall(PetscContainerSetPointer(c, ptrs[i])); 6409566063dSJacob Faibussowitsch PetscCall(PetscContainerSetUserDestroy(c, hypre_array_destroy)); 6419566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)(*B), names[i], (PetscObject)c)); 6429566063dSJacob Faibussowitsch PetscCall(PetscContainerDestroy(&c)); 643225daaf8SStefano Zampini } 64463c07aadSStefano Zampini } 6453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 64663c07aadSStefano Zampini } 64763c07aadSStefano Zampini 648d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 649d71ae5a4SJacob Faibussowitsch { 650613e5ff0Sstefano_zampini hypre_ParCSRMatrix *tA; 651c1a070e6SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd; 652c1a070e6SStefano Zampini Mat_SeqAIJ *diag, *offd; 6532cf14000SStefano Zampini PetscInt *garray, i, noffd, dnnz, onnz, *row_starts, *col_starts; 654c1a070e6SStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 655613e5ff0Sstefano_zampini PetscBool ismpiaij, isseqaij; 6562cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 6576ea7df73SStefano Zampini HYPRE_Int *hdi = NULL, *hdj = NULL, *hoi = NULL, *hoj = NULL; 6585c97c10fSStefano Zampini PetscInt *pdi = NULL, *pdj = NULL, *poi = NULL, *poj = NULL; 6596ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 6606ea7df73SStefano Zampini PetscBool iscuda = PETSC_FALSE; 6616ea7df73SStefano Zampini #endif 662c1a070e6SStefano Zampini 663c1a070e6SStefano Zampini PetscFunctionBegin; 6649566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij)); 6659566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &isseqaij)); 66608401ef6SPierre Jolivet PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Unsupported type %s", ((PetscObject)A)->type_name); 667*ea9ee2c1SPierre Jolivet PetscHYPREInitialize(); 668c1a070e6SStefano Zampini if (ismpiaij) { 669c1a070e6SStefano Zampini Mat_MPIAIJ *a = (Mat_MPIAIJ *)(A->data); 670c1a070e6SStefano Zampini 671c1a070e6SStefano Zampini diag = (Mat_SeqAIJ *)a->A->data; 672c1a070e6SStefano Zampini offd = (Mat_SeqAIJ *)a->B->data; 6736ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) && defined(HYPRE_USING_CUDA) 6749566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATMPIAIJCUSPARSE, &iscuda)); 6756ea7df73SStefano Zampini if (iscuda && !A->boundtocpu) { 6766ea7df73SStefano Zampini sameint = PETSC_TRUE; 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj)); 6789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj)); 6796ea7df73SStefano Zampini } else { 6806ea7df73SStefano Zampini #else 6816ea7df73SStefano Zampini { 6826ea7df73SStefano Zampini #endif 6836ea7df73SStefano Zampini pdi = diag->i; 6846ea7df73SStefano Zampini pdj = diag->j; 6856ea7df73SStefano Zampini poi = offd->i; 6866ea7df73SStefano Zampini poj = offd->j; 6876ea7df73SStefano Zampini if (sameint) { 6886ea7df73SStefano Zampini hdi = (HYPRE_Int *)pdi; 6896ea7df73SStefano Zampini hdj = (HYPRE_Int *)pdj; 6906ea7df73SStefano Zampini hoi = (HYPRE_Int *)poi; 6916ea7df73SStefano Zampini hoj = (HYPRE_Int *)poj; 6926ea7df73SStefano Zampini } 6936ea7df73SStefano Zampini } 694c1a070e6SStefano Zampini garray = a->garray; 695c1a070e6SStefano Zampini noffd = a->B->cmap->N; 696c1a070e6SStefano Zampini dnnz = diag->nz; 697c1a070e6SStefano Zampini onnz = offd->nz; 698c1a070e6SStefano Zampini } else { 699c1a070e6SStefano Zampini diag = (Mat_SeqAIJ *)A->data; 700c1a070e6SStefano Zampini offd = NULL; 7016ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) 7029566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATSEQAIJCUSPARSE, &iscuda)); 7036ea7df73SStefano Zampini if (iscuda && !A->boundtocpu) { 7046ea7df73SStefano Zampini sameint = PETSC_TRUE; 7059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj)); 7066ea7df73SStefano Zampini } else { 7076ea7df73SStefano Zampini #else 7086ea7df73SStefano Zampini { 7096ea7df73SStefano Zampini #endif 7106ea7df73SStefano Zampini pdi = diag->i; 7116ea7df73SStefano Zampini pdj = diag->j; 7126ea7df73SStefano Zampini if (sameint) { 7136ea7df73SStefano Zampini hdi = (HYPRE_Int *)pdi; 7146ea7df73SStefano Zampini hdj = (HYPRE_Int *)pdj; 7156ea7df73SStefano Zampini } 7166ea7df73SStefano Zampini } 717c1a070e6SStefano Zampini garray = NULL; 718c1a070e6SStefano Zampini noffd = 0; 719c1a070e6SStefano Zampini dnnz = diag->nz; 720c1a070e6SStefano Zampini onnz = 0; 721c1a070e6SStefano Zampini } 722225daaf8SStefano Zampini 723c1a070e6SStefano Zampini /* create a temporary ParCSR */ 724c1a070e6SStefano Zampini if (HYPRE_AssumedPartitionCheck()) { 725c1a070e6SStefano Zampini PetscMPIInt myid; 726c1a070e6SStefano Zampini 7279566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &myid)); 728c1a070e6SStefano Zampini row_starts = A->rmap->range + myid; 729c1a070e6SStefano Zampini col_starts = A->cmap->range + myid; 730c1a070e6SStefano Zampini } else { 731c1a070e6SStefano Zampini row_starts = A->rmap->range; 732c1a070e6SStefano Zampini col_starts = A->cmap->range; 733c1a070e6SStefano Zampini } 7342cf14000SStefano Zampini tA = hypre_ParCSRMatrixCreate(comm, A->rmap->N, A->cmap->N, (HYPRE_BigInt *)row_starts, (HYPRE_BigInt *)col_starts, noffd, dnnz, onnz); 735a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 736c1a070e6SStefano Zampini hypre_ParCSRMatrixSetRowStartsOwner(tA, 0); 737c1a070e6SStefano Zampini hypre_ParCSRMatrixSetColStartsOwner(tA, 0); 738a1d2239cSSatish Balay #endif 739c1a070e6SStefano Zampini 740225daaf8SStefano Zampini /* set diagonal part */ 741c1a070e6SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(tA); 7426ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 7439566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n + 1, &hdi, dnnz, &hdj)); 7446ea7df73SStefano Zampini for (i = 0; i < A->rmap->n + 1; i++) hdi[i] = (HYPRE_Int)(pdi[i]); 7456ea7df73SStefano Zampini for (i = 0; i < dnnz; i++) hdj[i] = (HYPRE_Int)(pdj[i]); 7462cf14000SStefano Zampini } 7476ea7df73SStefano Zampini hypre_CSRMatrixI(hdiag) = hdi; 7486ea7df73SStefano Zampini hypre_CSRMatrixJ(hdiag) = hdj; 74939accc25SStefano Zampini hypre_CSRMatrixData(hdiag) = (HYPRE_Complex *)diag->a; 750c1a070e6SStefano Zampini hypre_CSRMatrixNumNonzeros(hdiag) = diag->nz; 751c1a070e6SStefano Zampini hypre_CSRMatrixSetRownnz(hdiag); 752c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hdiag, 0); 753c1a070e6SStefano Zampini 754225daaf8SStefano Zampini /* set offdiagonal part */ 755c1a070e6SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(tA); 756c1a070e6SStefano Zampini if (offd) { 7576ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 7589566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n + 1, &hoi, onnz, &hoj)); 7596ea7df73SStefano Zampini for (i = 0; i < A->rmap->n + 1; i++) hoi[i] = (HYPRE_Int)(poi[i]); 7606ea7df73SStefano Zampini for (i = 0; i < onnz; i++) hoj[i] = (HYPRE_Int)(poj[i]); 7612cf14000SStefano Zampini } 7626ea7df73SStefano Zampini hypre_CSRMatrixI(hoffd) = hoi; 7636ea7df73SStefano Zampini hypre_CSRMatrixJ(hoffd) = hoj; 76439accc25SStefano Zampini hypre_CSRMatrixData(hoffd) = (HYPRE_Complex *)offd->a; 765c1a070e6SStefano Zampini hypre_CSRMatrixNumNonzeros(hoffd) = offd->nz; 766c1a070e6SStefano Zampini hypre_CSRMatrixSetRownnz(hoffd); 767c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hoffd, 0); 7686ea7df73SStefano Zampini } 7696ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 770792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize_v2, tA, iscuda ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST); 7716ea7df73SStefano Zampini #else 7726ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 773792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize, tA); 7746ea7df73SStefano Zampini #else 775792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize_v2, tA, HYPRE_MEMORY_HOST); 7766ea7df73SStefano Zampini #endif 7776ea7df73SStefano Zampini #endif 7786ea7df73SStefano Zampini hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA), HYPRE_MEMORY_HOST); 779c1a070e6SStefano Zampini hypre_ParCSRMatrixSetNumNonzeros(tA); 7802cf14000SStefano Zampini hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt *)garray; 781792fecdfSBarry Smith if (!hypre_ParCSRMatrixCommPkg(tA)) PetscCallExternal(hypre_MatvecCommPkgCreate, tA); 782613e5ff0Sstefano_zampini *hA = tA; 7833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 784613e5ff0Sstefano_zampini } 785c1a070e6SStefano Zampini 786d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 787d71ae5a4SJacob Faibussowitsch { 788613e5ff0Sstefano_zampini hypre_CSRMatrix *hdiag, *hoffd; 7896ea7df73SStefano Zampini PetscBool ismpiaij, sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 7906ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 7916ea7df73SStefano Zampini PetscBool iscuda = PETSC_FALSE; 7926ea7df73SStefano Zampini #endif 793c1a070e6SStefano Zampini 794613e5ff0Sstefano_zampini PetscFunctionBegin; 7959566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij)); 7966ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 7979566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, "")); 7986ea7df73SStefano Zampini if (iscuda) sameint = PETSC_TRUE; 7996ea7df73SStefano Zampini #endif 800613e5ff0Sstefano_zampini hdiag = hypre_ParCSRMatrixDiag(*hA); 801613e5ff0Sstefano_zampini hoffd = hypre_ParCSRMatrixOffd(*hA); 8026ea7df73SStefano Zampini /* free temporary memory allocated by PETSc 8036ea7df73SStefano Zampini set pointers to NULL before destroying tA */ 8042cf14000SStefano Zampini if (!sameint) { 8052cf14000SStefano Zampini HYPRE_Int *hi, *hj; 8062cf14000SStefano Zampini 8072cf14000SStefano Zampini hi = hypre_CSRMatrixI(hdiag); 8082cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hdiag); 8099566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi, hj)); 8106ea7df73SStefano Zampini if (ismpiaij) { 8112cf14000SStefano Zampini hi = hypre_CSRMatrixI(hoffd); 8122cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hoffd); 8139566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi, hj)); 8142cf14000SStefano Zampini } 8152cf14000SStefano Zampini } 816c1a070e6SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 817c1a070e6SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 818c1a070e6SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 8196ea7df73SStefano Zampini if (ismpiaij) { 820c1a070e6SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 821c1a070e6SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 822c1a070e6SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 8236ea7df73SStefano Zampini } 824613e5ff0Sstefano_zampini hypre_ParCSRMatrixColMapOffd(*hA) = NULL; 825613e5ff0Sstefano_zampini hypre_ParCSRMatrixDestroy(*hA); 826613e5ff0Sstefano_zampini *hA = NULL; 8273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 828613e5ff0Sstefano_zampini } 829613e5ff0Sstefano_zampini 830613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG: 8313dad0653Sstefano_zampini the resulting ParCSR will not own the column and row starts 8326ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 833d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP) 834d71ae5a4SJacob Faibussowitsch { 835a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 836613e5ff0Sstefano_zampini HYPRE_Int P_owns_col_starts, R_owns_row_starts; 837a1d2239cSSatish Balay #endif 838613e5ff0Sstefano_zampini 839613e5ff0Sstefano_zampini PetscFunctionBegin; 840a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 841613e5ff0Sstefano_zampini P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP); 842613e5ff0Sstefano_zampini R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR); 843a1d2239cSSatish Balay #endif 8446ea7df73SStefano Zampini /* can be replaced by version test later */ 8456ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 846792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatrixRAP"); 8476ea7df73SStefano Zampini *hRAP = hypre_ParCSRMatrixRAP(hR, hA, hP); 8486ea7df73SStefano Zampini PetscStackPop; 8496ea7df73SStefano Zampini #else 850792fecdfSBarry Smith PetscCallExternal(hypre_BoomerAMGBuildCoarseOperator, hR, hA, hP, hRAP); 851792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixSetNumNonzeros, *hRAP); 8526ea7df73SStefano Zampini #endif 853613e5ff0Sstefano_zampini /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */ 854a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 855613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetRowStartsOwner(*hRAP, 0); 856613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetColStartsOwner(*hRAP, 0); 857613e5ff0Sstefano_zampini if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP, 1); 858613e5ff0Sstefano_zampini if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR, 1); 859a1d2239cSSatish Balay #endif 8603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 861613e5ff0Sstefano_zampini } 862613e5ff0Sstefano_zampini 863d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat P, Mat C) 864d71ae5a4SJacob Faibussowitsch { 8656f231fbdSstefano_zampini Mat B; 8666abb4441SStefano Zampini hypre_ParCSRMatrix *hA, *hP, *hPtAP = NULL; 8674222ddf1SHong Zhang Mat_Product *product = C->product; 868613e5ff0Sstefano_zampini 869613e5ff0Sstefano_zampini PetscFunctionBegin; 8709566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 8719566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(P, &hP)); 8729566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hP, hA, hP, &hPtAP)); 8739566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hPtAP, MATAIJ, PETSC_OWN_POINTER, &B)); 8744222ddf1SHong Zhang 8759566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 8764222ddf1SHong Zhang C->product = product; 8774222ddf1SHong Zhang 8789566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 8799566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(P, &hP)); 8803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8816f231fbdSstefano_zampini } 8826f231fbdSstefano_zampini 883d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat P, PetscReal fill, Mat C) 884d71ae5a4SJacob Faibussowitsch { 8856f231fbdSstefano_zampini PetscFunctionBegin; 8869566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 8874222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_AIJ_wHYPRE; 8884222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 8893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 890613e5ff0Sstefano_zampini } 891613e5ff0Sstefano_zampini 892d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A, Mat P, Mat C) 893d71ae5a4SJacob Faibussowitsch { 8944cc28894Sstefano_zampini Mat B; 8954cc28894Sstefano_zampini Mat_HYPRE *hP; 8966abb4441SStefano Zampini hypre_ParCSRMatrix *hA = NULL, *Pparcsr, *ptapparcsr = NULL; 897613e5ff0Sstefano_zampini HYPRE_Int type; 898613e5ff0Sstefano_zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 8994cc28894Sstefano_zampini PetscBool ishypre; 900613e5ff0Sstefano_zampini 901613e5ff0Sstefano_zampini PetscFunctionBegin; 9029566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre)); 90328b400f6SJacob Faibussowitsch PetscCheck(ishypre, comm, PETSC_ERR_USER, "P should be of type %s", MATHYPRE); 9044cc28894Sstefano_zampini hP = (Mat_HYPRE *)P->data; 905792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hP->ij, &type); 90608401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 907792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hP->ij, (void **)&Pparcsr); 908613e5ff0Sstefano_zampini 9099566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 9109566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, hA, Pparcsr, &ptapparcsr)); 9119566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 912225daaf8SStefano Zampini 9134cc28894Sstefano_zampini /* create temporary matrix and merge to C */ 9149566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr, ((PetscObject)C)->type_name, PETSC_OWN_POINTER, &B)); 9159566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 9163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9174cc28894Sstefano_zampini } 9184cc28894Sstefano_zampini 919d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A, Mat P, Mat C) 920d71ae5a4SJacob Faibussowitsch { 9214cc28894Sstefano_zampini Mat B; 9226abb4441SStefano Zampini hypre_ParCSRMatrix *Aparcsr, *Pparcsr, *ptapparcsr = NULL; 9234cc28894Sstefano_zampini Mat_HYPRE *hA, *hP; 9244cc28894Sstefano_zampini PetscBool ishypre; 9254cc28894Sstefano_zampini HYPRE_Int type; 9264cc28894Sstefano_zampini 9274cc28894Sstefano_zampini PetscFunctionBegin; 9289566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre)); 92928b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)P), PETSC_ERR_USER, "P should be of type %s", MATHYPRE); 9309566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre)); 93128b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE); 9324cc28894Sstefano_zampini hA = (Mat_HYPRE *)A->data; 9334cc28894Sstefano_zampini hP = (Mat_HYPRE *)P->data; 934792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type); 93508401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 936792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hP->ij, &type); 93708401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)P), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 938792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&Aparcsr); 939792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hP->ij, (void **)&Pparcsr); 9409566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, Aparcsr, Pparcsr, &ptapparcsr)); 9419566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr, MATHYPRE, PETSC_OWN_POINTER, &B)); 9429566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B)); 9433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9444cc28894Sstefano_zampini } 9454cc28894Sstefano_zampini 946d501dc42Sstefano_zampini /* calls hypre_ParMatmul 947d501dc42Sstefano_zampini hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA 9483dad0653Sstefano_zampini hypre_ParMatrixCreate does not duplicate the communicator 9496ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 950d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB) 951d71ae5a4SJacob Faibussowitsch { 952d501dc42Sstefano_zampini PetscFunctionBegin; 9536ea7df73SStefano Zampini /* can be replaced by version test later */ 9546ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 955792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatMat"); 9566ea7df73SStefano Zampini *hAB = hypre_ParCSRMatMat(hA, hB); 9576ea7df73SStefano Zampini #else 958792fecdfSBarry Smith PetscStackPushExternal("hypre_ParMatmul"); 959d501dc42Sstefano_zampini *hAB = hypre_ParMatmul(hA, hB); 9606ea7df73SStefano Zampini #endif 961d501dc42Sstefano_zampini PetscStackPop; 9623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 963d501dc42Sstefano_zampini } 964d501dc42Sstefano_zampini 965d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C) 966d71ae5a4SJacob Faibussowitsch { 9675e5acdf2Sstefano_zampini Mat D; 968d501dc42Sstefano_zampini hypre_ParCSRMatrix *hA, *hB, *hAB = NULL; 9694222ddf1SHong Zhang Mat_Product *product = C->product; 9705e5acdf2Sstefano_zampini 9715e5acdf2Sstefano_zampini PetscFunctionBegin; 9729566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 9739566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B, &hB)); 9749566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(hA, hB, &hAB)); 9759566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hAB, MATAIJ, PETSC_OWN_POINTER, &D)); 9764222ddf1SHong Zhang 9779566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &D)); 9784222ddf1SHong Zhang C->product = product; 9794222ddf1SHong Zhang 9809566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 9819566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B, &hB)); 9823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9835e5acdf2Sstefano_zampini } 9845e5acdf2Sstefano_zampini 985d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat B, PetscReal fill, Mat C) 986d71ae5a4SJacob Faibussowitsch { 9875e5acdf2Sstefano_zampini PetscFunctionBegin; 9889566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 9894222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE; 9904222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 9913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9925e5acdf2Sstefano_zampini } 9935e5acdf2Sstefano_zampini 994d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A, Mat B, Mat C) 995d71ae5a4SJacob Faibussowitsch { 996d501dc42Sstefano_zampini Mat D; 997d501dc42Sstefano_zampini hypre_ParCSRMatrix *Aparcsr, *Bparcsr, *ABparcsr = NULL; 998d501dc42Sstefano_zampini Mat_HYPRE *hA, *hB; 999d501dc42Sstefano_zampini PetscBool ishypre; 1000d501dc42Sstefano_zampini HYPRE_Int type; 10014222ddf1SHong Zhang Mat_Product *product; 1002d501dc42Sstefano_zampini 1003d501dc42Sstefano_zampini PetscFunctionBegin; 10049566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHYPRE, &ishypre)); 100528b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)B), PETSC_ERR_USER, "B should be of type %s", MATHYPRE); 10069566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre)); 100728b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE); 1008d501dc42Sstefano_zampini hA = (Mat_HYPRE *)A->data; 1009d501dc42Sstefano_zampini hB = (Mat_HYPRE *)B->data; 1010792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type); 101108401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1012792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hB->ij, &type); 101308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported"); 1014792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&Aparcsr); 1015792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hB->ij, (void **)&Bparcsr); 10169566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(Aparcsr, Bparcsr, &ABparcsr)); 10179566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ABparcsr, MATHYPRE, PETSC_OWN_POINTER, &D)); 10184222ddf1SHong Zhang 1019d501dc42Sstefano_zampini /* need to use HeaderReplace because HeaderMerge messes up with the communicator */ 10204222ddf1SHong Zhang product = C->product; /* save it from MatHeaderReplace() */ 10214222ddf1SHong Zhang C->product = NULL; 10229566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(C, &D)); 10234222ddf1SHong Zhang C->product = product; 1024d501dc42Sstefano_zampini C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 10254222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 10263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1027d501dc42Sstefano_zampini } 1028d501dc42Sstefano_zampini 1029d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, Mat D) 1030d71ae5a4SJacob Faibussowitsch { 103120e1dc0dSstefano_zampini Mat E; 10326abb4441SStefano Zampini hypre_ParCSRMatrix *hA, *hB, *hC, *hABC = NULL; 103320e1dc0dSstefano_zampini 103420e1dc0dSstefano_zampini PetscFunctionBegin; 10359566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA)); 10369566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B, &hB)); 10379566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(C, &hC)); 10389566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hA, hB, hC, &hABC)); 10399566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hABC, MATAIJ, PETSC_OWN_POINTER, &E)); 10409566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(D, &E)); 10419566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA)); 10429566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B, &hB)); 10439566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(C, &hC)); 10443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 104520e1dc0dSstefano_zampini } 104620e1dc0dSstefano_zampini 1047d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, PetscReal fill, Mat D) 1048d71ae5a4SJacob Faibussowitsch { 104920e1dc0dSstefano_zampini PetscFunctionBegin; 10509566063dSJacob Faibussowitsch PetscCall(MatSetType(D, MATAIJ)); 10513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 105220e1dc0dSstefano_zampini } 105320e1dc0dSstefano_zampini 1054d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C) 1055d71ae5a4SJacob Faibussowitsch { 10564222ddf1SHong Zhang PetscFunctionBegin; 10574222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 10583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10594222ddf1SHong Zhang } 10604222ddf1SHong Zhang 1061d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C) 1062d71ae5a4SJacob Faibussowitsch { 10634222ddf1SHong Zhang Mat_Product *product = C->product; 10644222ddf1SHong Zhang PetscBool Ahypre; 10654222ddf1SHong Zhang 10664222ddf1SHong Zhang PetscFunctionBegin; 10679566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)product->A, MATHYPRE, &Ahypre)); 10684222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 10699566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 10704222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE; 10714222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 10723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10736718818eSStefano Zampini } 10743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10754222ddf1SHong Zhang } 10764222ddf1SHong Zhang 1077d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C) 1078d71ae5a4SJacob Faibussowitsch { 10794222ddf1SHong Zhang PetscFunctionBegin; 10804222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 10813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10824222ddf1SHong Zhang } 10834222ddf1SHong Zhang 1084d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C) 1085d71ae5a4SJacob Faibussowitsch { 10864222ddf1SHong Zhang Mat_Product *product = C->product; 10874222ddf1SHong Zhang PetscBool flg; 10884222ddf1SHong Zhang PetscInt type = 0; 10894222ddf1SHong Zhang const char *outTypes[4] = {"aij", "seqaij", "mpiaij", "hypre"}; 10904222ddf1SHong Zhang PetscInt ntype = 4; 10914222ddf1SHong Zhang Mat A = product->A; 10924222ddf1SHong Zhang PetscBool Ahypre; 10934222ddf1SHong Zhang 10944222ddf1SHong Zhang PetscFunctionBegin; 10959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &Ahypre)); 10964222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 10979566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 10984222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 10994222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_HYPRE_HYPRE; 11003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11014222ddf1SHong Zhang } 11024222ddf1SHong Zhang 11034222ddf1SHong Zhang /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */ 11044222ddf1SHong Zhang /* Get runtime option */ 11054222ddf1SHong Zhang if (product->api_user) { 1106d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatPtAP_HYPRE", "Mat"); 11079566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-matptap_hypre_outtype", "MatPtAP outtype", "MatPtAP outtype", outTypes, ntype, outTypes[type], &type, &flg)); 1108d0609cedSBarry Smith PetscOptionsEnd(); 11094222ddf1SHong Zhang } else { 1110d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatProduct_PtAP_HYPRE", "Mat"); 11119566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-mat_product_algorithm_hypre_outtype", "MatProduct_PtAP outtype", "MatProduct_PtAP", outTypes, ntype, outTypes[type], &type, &flg)); 1112d0609cedSBarry Smith PetscOptionsEnd(); 11134222ddf1SHong Zhang } 11144222ddf1SHong Zhang 11154222ddf1SHong Zhang if (type == 0 || type == 1 || type == 2) { 11169566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ)); 11174222ddf1SHong Zhang } else if (type == 3) { 11189566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE)); 11194222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C), PETSC_ERR_SUP, "MatPtAP outtype is not supported"); 11204222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 11214222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_HYPRE; 11223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11234222ddf1SHong Zhang } 11244222ddf1SHong Zhang 1125d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C) 1126d71ae5a4SJacob Faibussowitsch { 11274222ddf1SHong Zhang Mat_Product *product = C->product; 11284222ddf1SHong Zhang 11294222ddf1SHong Zhang PetscFunctionBegin; 11304222ddf1SHong Zhang switch (product->type) { 1131d71ae5a4SJacob Faibussowitsch case MATPRODUCT_AB: 1132d71ae5a4SJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_AB(C)); 1133d71ae5a4SJacob Faibussowitsch break; 1134d71ae5a4SJacob Faibussowitsch case MATPRODUCT_PtAP: 1135d71ae5a4SJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_PtAP(C)); 1136d71ae5a4SJacob Faibussowitsch break; 1137d71ae5a4SJacob Faibussowitsch default: 1138d71ae5a4SJacob Faibussowitsch break; 11394222ddf1SHong Zhang } 11403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11414222ddf1SHong Zhang } 11424222ddf1SHong Zhang 1143d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y) 1144d71ae5a4SJacob Faibussowitsch { 114563c07aadSStefano Zampini PetscFunctionBegin; 11469566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_TRUE)); 11473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 114863c07aadSStefano Zampini } 114963c07aadSStefano Zampini 1150d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y) 1151d71ae5a4SJacob Faibussowitsch { 115263c07aadSStefano Zampini PetscFunctionBegin; 11539566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_FALSE)); 11543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115563c07aadSStefano Zampini } 115663c07aadSStefano Zampini 1157d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1158d71ae5a4SJacob Faibussowitsch { 1159414bd5c3SStefano Zampini PetscFunctionBegin; 116048a46eb9SPierre Jolivet if (y != z) PetscCall(VecCopy(y, z)); 11619566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_FALSE)); 11623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1163414bd5c3SStefano Zampini } 1164414bd5c3SStefano Zampini 1165d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1166d71ae5a4SJacob Faibussowitsch { 1167414bd5c3SStefano Zampini PetscFunctionBegin; 116848a46eb9SPierre Jolivet if (y != z) PetscCall(VecCopy(y, z)); 11699566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_TRUE)); 11703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1171414bd5c3SStefano Zampini } 1172414bd5c3SStefano Zampini 1173414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */ 1174d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans) 1175d71ae5a4SJacob Faibussowitsch { 117663c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 117763c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 117863c07aadSStefano Zampini hypre_ParVector *hx, *hy; 117963c07aadSStefano Zampini 118063c07aadSStefano Zampini PetscFunctionBegin; 118163c07aadSStefano Zampini if (trans) { 11829566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->b, x)); 11839566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->x, y)); 11849566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->x, y)); 1185792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject, hA->b->ij, (void **)&hx); 1186792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject, hA->x->ij, (void **)&hy); 118763c07aadSStefano Zampini } else { 11889566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->x, x)); 11899566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->b, y)); 11909566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->b, y)); 1191792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject, hA->x->ij, (void **)&hx); 1192792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject, hA->b->ij, (void **)&hy); 119363c07aadSStefano Zampini } 1194792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr); 11956ea7df73SStefano Zampini if (trans) { 1196792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMatvecT, a, parcsr, hx, b, hy); 11976ea7df73SStefano Zampini } else { 1198792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMatvec, a, parcsr, hx, b, hy); 11996ea7df73SStefano Zampini } 12009566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->x)); 12019566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->b)); 12023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120363c07aadSStefano Zampini } 120463c07aadSStefano Zampini 1205d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDestroy_HYPRE(Mat A) 1206d71ae5a4SJacob Faibussowitsch { 120763c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 120863c07aadSStefano Zampini 120963c07aadSStefano Zampini PetscFunctionBegin; 12109566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->x)); 12119566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->b)); 1212978814f1SStefano Zampini if (hA->ij) { 1213978814f1SStefano Zampini if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL; 1214792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixDestroy, hA->ij); 1215978814f1SStefano Zampini } 12169566063dSJacob Faibussowitsch if (hA->comm) PetscCall(PetscCommRestoreComm(PetscObjectComm((PetscObject)A), &hA->comm)); 1217c69f721fSFande Kong 12189566063dSJacob Faibussowitsch PetscCall(MatStashDestroy_Private(&A->stash)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array)); 1220c69f721fSFande Kong 12215fbaff96SJunchao Zhang if (hA->cooMat) { 12225fbaff96SJunchao Zhang PetscCall(MatDestroy(&hA->cooMat)); 1223e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->diagJ, hA->memType)); 1224e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->offdJ, hA->memType)); 1225e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hA->diag, hA->memType)); 12265fbaff96SJunchao Zhang } 12275fbaff96SJunchao Zhang 12289566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_aij_C", NULL)); 12299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_is_C", NULL)); 12309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_hypre_C", NULL)); 12319566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaij_hypre_C", NULL)); 12329566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPRESetPreallocation_C", NULL)); 12339566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPREGetParCSR_C", NULL)); 12345fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12355fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12369566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 12373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 123863c07aadSStefano Zampini } 123963c07aadSStefano Zampini 1240d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetUp_HYPRE(Mat A) 1241d71ae5a4SJacob Faibussowitsch { 12424ec6421dSstefano_zampini PetscFunctionBegin; 12439566063dSJacob Faibussowitsch PetscCall(MatHYPRESetPreallocation(A, PETSC_DEFAULT, NULL, PETSC_DEFAULT, NULL)); 12443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12454ec6421dSstefano_zampini } 12464ec6421dSstefano_zampini 12476ea7df73SStefano Zampini //TODO FIX hypre_CSRMatrixMatvecOutOfPlace 12486ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 1249d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind) 1250d71ae5a4SJacob Faibussowitsch { 12516ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 12526ea7df73SStefano Zampini HYPRE_MemoryLocation hmem = bind ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE; 12536ea7df73SStefano Zampini 12546ea7df73SStefano Zampini PetscFunctionBegin; 12556ea7df73SStefano Zampini A->boundtocpu = bind; 12565fbaff96SJunchao Zhang if (hA->ij && hypre_IJMatrixAssembleFlag(hA->ij) && hmem != hypre_IJMatrixMemoryLocation(hA->ij)) { 12576ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 1258792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr); 1259792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMigrate, parcsr, hmem); 12606ea7df73SStefano Zampini } 12619566063dSJacob Faibussowitsch if (hA->x) PetscCall(VecHYPRE_IJBindToCPU(hA->x, bind)); 12629566063dSJacob Faibussowitsch if (hA->b) PetscCall(VecHYPRE_IJBindToCPU(hA->b, bind)); 12633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12646ea7df73SStefano Zampini } 12656ea7df73SStefano Zampini #endif 12666ea7df73SStefano Zampini 1267d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode) 1268d71ae5a4SJacob Faibussowitsch { 126963c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1270c69f721fSFande Kong PetscMPIInt n; 1271c69f721fSFande Kong PetscInt i, j, rstart, ncols, flg; 1272c69f721fSFande Kong PetscInt *row, *col; 1273c69f721fSFande Kong PetscScalar *val; 127463c07aadSStefano Zampini 127563c07aadSStefano Zampini PetscFunctionBegin; 127608401ef6SPierre Jolivet PetscCheck(mode != MAT_FLUSH_ASSEMBLY, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE"); 1277c69f721fSFande Kong 1278c69f721fSFande Kong if (!A->nooffprocentries) { 1279c69f721fSFande Kong while (1) { 12809566063dSJacob Faibussowitsch PetscCall(MatStashScatterGetMesg_Private(&A->stash, &n, &row, &col, &val, &flg)); 1281c69f721fSFande Kong if (!flg) break; 1282c69f721fSFande Kong 1283c69f721fSFande Kong for (i = 0; i < n;) { 1284c69f721fSFande Kong /* Now identify the consecutive vals belonging to the same row */ 1285c69f721fSFande Kong for (j = i, rstart = row[j]; j < n; j++) { 1286c69f721fSFande Kong if (row[j] != rstart) break; 1287c69f721fSFande Kong } 1288c69f721fSFande Kong if (j < n) ncols = j - i; 1289c69f721fSFande Kong else ncols = n - i; 1290c69f721fSFande Kong /* Now assemble all these values with a single function call */ 12919566063dSJacob Faibussowitsch PetscCall(MatSetValues_HYPRE(A, 1, row + i, ncols, col + i, val + i, A->insertmode)); 1292c69f721fSFande Kong 1293c69f721fSFande Kong i = j; 1294c69f721fSFande Kong } 1295c69f721fSFande Kong } 12969566063dSJacob Faibussowitsch PetscCall(MatStashScatterEnd_Private(&A->stash)); 1297c69f721fSFande Kong } 1298c69f721fSFande Kong 1299792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixAssemble, hA->ij); 1300336664bdSPierre Jolivet /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */ 1301336664bdSPierre Jolivet /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */ 1302336664bdSPierre Jolivet if (!hA->sorted_full) { 1303af1cf968SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1304af1cf968SStefano Zampini 1305af1cf968SStefano Zampini /* call destroy just to make sure we do not leak anything */ 1306af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1307792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixDestroy, aux_matrix); 1308af1cf968SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1309af1cf968SStefano Zampini 1310af1cf968SStefano Zampini /* Initialize with assembled flag -> it only recreates the aux_par_matrix */ 1311792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize, hA->ij); 1312af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 13136ea7df73SStefano Zampini if (aux_matrix) { 1314af1cf968SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see comment in MatHYPRESetPreallocation_HYPRE */ 131522235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 1316792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixInitialize, aux_matrix); 131722235d61SPierre Jolivet #else 1318792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixInitialize_v2, aux_matrix, HYPRE_MEMORY_HOST); 131922235d61SPierre Jolivet #endif 1320af1cf968SStefano Zampini } 13216ea7df73SStefano Zampini } 13226ea7df73SStefano Zampini { 13236ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 13246ea7df73SStefano Zampini 1325792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)&parcsr); 1326792fecdfSBarry Smith if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscCallExternal(hypre_MatvecCommPkgCreate, parcsr); 13276ea7df73SStefano Zampini } 13289566063dSJacob Faibussowitsch if (!hA->x) PetscCall(VecHYPRE_IJVectorCreate(A->cmap, &hA->x)); 13299566063dSJacob Faibussowitsch if (!hA->b) PetscCall(VecHYPRE_IJVectorCreate(A->rmap, &hA->b)); 13306ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 13319566063dSJacob Faibussowitsch PetscCall(MatBindToCPU_HYPRE(A, A->boundtocpu)); 13326ea7df73SStefano Zampini #endif 13333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 133463c07aadSStefano Zampini } 133563c07aadSStefano Zampini 1336d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array) 1337d71ae5a4SJacob Faibussowitsch { 1338c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1339c69f721fSFande Kong 1340c69f721fSFande Kong PetscFunctionBegin; 134128b400f6SJacob Faibussowitsch PetscCheck(hA->available, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Temporary space is in use"); 1342c69f721fSFande Kong 134339accc25SStefano Zampini if (hA->size >= size) { 134439accc25SStefano Zampini *array = hA->array; 134539accc25SStefano Zampini } else { 13469566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array)); 1347c69f721fSFande Kong hA->size = size; 13489566063dSJacob Faibussowitsch PetscCall(PetscMalloc(hA->size, &hA->array)); 1349c69f721fSFande Kong *array = hA->array; 1350c69f721fSFande Kong } 1351c69f721fSFande Kong 1352c69f721fSFande Kong hA->available = PETSC_FALSE; 13533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1354c69f721fSFande Kong } 1355c69f721fSFande Kong 1356d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array) 1357d71ae5a4SJacob Faibussowitsch { 1358c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1359c69f721fSFande Kong 1360c69f721fSFande Kong PetscFunctionBegin; 1361c69f721fSFande Kong *array = NULL; 1362c69f721fSFande Kong hA->available = PETSC_TRUE; 13633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1364c69f721fSFande Kong } 1365c69f721fSFande Kong 1366d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins) 1367d71ae5a4SJacob Faibussowitsch { 1368d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1369d975228cSstefano_zampini PetscScalar *vals = (PetscScalar *)v; 137039accc25SStefano Zampini HYPRE_Complex *sscr; 1371c69f721fSFande Kong PetscInt *cscr[2]; 1372c69f721fSFande Kong PetscInt i, nzc; 137308defe43SFande Kong void *array = NULL; 1374d975228cSstefano_zampini 1375d975228cSstefano_zampini PetscFunctionBegin; 13769566063dSJacob Faibussowitsch PetscCall(MatGetArray_HYPRE(A, sizeof(PetscInt) * (2 * nc) + sizeof(HYPRE_Complex) * nc * nr, &array)); 1377c69f721fSFande Kong cscr[0] = (PetscInt *)array; 1378c69f721fSFande Kong cscr[1] = ((PetscInt *)array) + nc; 137939accc25SStefano Zampini sscr = (HYPRE_Complex *)(((PetscInt *)array) + nc * 2); 1380d975228cSstefano_zampini for (i = 0, nzc = 0; i < nc; i++) { 1381d975228cSstefano_zampini if (cols[i] >= 0) { 1382d975228cSstefano_zampini cscr[0][nzc] = cols[i]; 1383d975228cSstefano_zampini cscr[1][nzc++] = i; 1384d975228cSstefano_zampini } 1385d975228cSstefano_zampini } 1386c69f721fSFande Kong if (!nzc) { 13879566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A, &array)); 13883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1389c69f721fSFande Kong } 1390d975228cSstefano_zampini 13916ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE) 13926ea7df73SStefano Zampini if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) { 13936ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 13946ea7df73SStefano Zampini 1395792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 1396792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMigrate,parcsr, HYPRE_MEMORY_HOST); 13976ea7df73SStefano Zampini } 13986ea7df73SStefano Zampini #endif 13996ea7df73SStefano Zampini 1400d975228cSstefano_zampini if (ins == ADD_VALUES) { 1401d975228cSstefano_zampini for (i = 0; i < nr; i++) { 14026ea7df73SStefano Zampini if (rows[i] >= 0) { 1403d975228cSstefano_zampini PetscInt j; 14042cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 14052cf14000SStefano Zampini 1406aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]); 14079566063dSJacob Faibussowitsch for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j])); 1408792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixAddToValues, hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr); 1409d975228cSstefano_zampini } 1410d975228cSstefano_zampini vals += nc; 1411d975228cSstefano_zampini } 1412d975228cSstefano_zampini } else { /* INSERT_VALUES */ 1413d975228cSstefano_zampini PetscInt rst, ren; 1414c69f721fSFande Kong 14159566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, &ren)); 1416d975228cSstefano_zampini for (i = 0; i < nr; i++) { 14176ea7df73SStefano Zampini if (rows[i] >= 0) { 1418d975228cSstefano_zampini PetscInt j; 14192cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 14202cf14000SStefano Zampini 1421aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]); 14229566063dSJacob Faibussowitsch for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j])); 1423c69f721fSFande Kong /* nonlocal values */ 14249566063dSJacob Faibussowitsch if (rows[i] < rst || rows[i] >= ren) PetscCall(MatStashValuesRow_Private(&A->stash, rows[i], nzc, cscr[0], (PetscScalar *)sscr, PETSC_FALSE)); 1425c69f721fSFande Kong /* local values */ 1426792fecdfSBarry Smith else PetscCallExternal(HYPRE_IJMatrixSetValues, hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr); 1427d975228cSstefano_zampini } 1428d975228cSstefano_zampini vals += nc; 1429d975228cSstefano_zampini } 1430d975228cSstefano_zampini } 1431c69f721fSFande Kong 14329566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A, &array)); 14333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1434d975228cSstefano_zampini } 1435d975228cSstefano_zampini 1436d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1437d71ae5a4SJacob Faibussowitsch { 1438d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 14397d968826Sstefano_zampini HYPRE_Int *hdnnz, *honnz; 144006a29025Sstefano_zampini PetscInt i, rs, re, cs, ce, bs; 1441d975228cSstefano_zampini PetscMPIInt size; 1442d975228cSstefano_zampini 1443d975228cSstefano_zampini PetscFunctionBegin; 14449566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 14459566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 1446d975228cSstefano_zampini rs = A->rmap->rstart; 1447d975228cSstefano_zampini re = A->rmap->rend; 1448d975228cSstefano_zampini cs = A->cmap->rstart; 1449d975228cSstefano_zampini ce = A->cmap->rend; 1450d975228cSstefano_zampini if (!hA->ij) { 1451792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rs, re - 1, cs, ce - 1, &hA->ij); 1452792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR); 1453d975228cSstefano_zampini } else { 14542cf14000SStefano Zampini HYPRE_BigInt hrs, hre, hcs, hce; 1455792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetLocalRange, hA->ij, &hrs, &hre, &hcs, &hce); 1456aed4548fSBarry Smith PetscCheck(hre - hrs + 1 == re - rs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local rows: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hrs, hre + 1, rs, re); 1457aed4548fSBarry Smith PetscCheck(hce - hcs + 1 == ce - cs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local cols: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hcs, hce + 1, cs, ce); 1458d975228cSstefano_zampini } 14599566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 146006a29025Sstefano_zampini if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10 * bs; 146106a29025Sstefano_zampini if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10 * bs; 146206a29025Sstefano_zampini 1463d975228cSstefano_zampini if (!dnnz) { 14649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &hdnnz)); 1465d975228cSstefano_zampini for (i = 0; i < A->rmap->n; i++) hdnnz[i] = dnz; 1466d975228cSstefano_zampini } else { 14677d968826Sstefano_zampini hdnnz = (HYPRE_Int *)dnnz; 1468d975228cSstefano_zampini } 14699566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size)); 1470d975228cSstefano_zampini if (size > 1) { 1471ddbeb582SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1472d975228cSstefano_zampini if (!onnz) { 14739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &honnz)); 1474d975228cSstefano_zampini for (i = 0; i < A->rmap->n; i++) honnz[i] = onz; 147522235d61SPierre Jolivet } else honnz = (HYPRE_Int *)onnz; 1476ddbeb582SStefano Zampini /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems 1477ddbeb582SStefano Zampini they assume the user will input the entire row values, properly sorted 1478336664bdSPierre Jolivet In PETSc, we don't make such an assumption and set this flag to 1, 1479336664bdSPierre Jolivet unless the option MAT_SORTED_FULL is set to true. 1480ddbeb582SStefano Zampini Also, to avoid possible memory leaks, we destroy and recreate the translator 1481ddbeb582SStefano Zampini This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize 1482ddbeb582SStefano Zampini the IJ matrix for us */ 1483ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1484ddbeb582SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 1485ddbeb582SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1486792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes, hA->ij, hdnnz, honnz); 1487ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij); 1488336664bdSPierre Jolivet hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !hA->sorted_full; 1489d975228cSstefano_zampini } else { 1490d975228cSstefano_zampini honnz = NULL; 1491792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetRowSizes, hA->ij, hdnnz); 1492d975228cSstefano_zampini } 1493ddbeb582SStefano Zampini 1494af1cf968SStefano Zampini /* reset assembled flag and call the initialize method */ 1495af1cf968SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 0; 14966ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 1497792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize, hA->ij); 14986ea7df73SStefano Zampini #else 1499792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize_v2, hA->ij, HYPRE_MEMORY_HOST); 15006ea7df73SStefano Zampini #endif 150148a46eb9SPierre Jolivet if (!dnnz) PetscCall(PetscFree(hdnnz)); 150248a46eb9SPierre Jolivet if (!onnz && honnz) PetscCall(PetscFree(honnz)); 1503af1cf968SStefano Zampini /* Match AIJ logic */ 150406a29025Sstefano_zampini A->preallocated = PETSC_TRUE; 1505af1cf968SStefano Zampini A->assembled = PETSC_FALSE; 15063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1507d975228cSstefano_zampini } 1508d975228cSstefano_zampini 1509d975228cSstefano_zampini /*@C 1510d975228cSstefano_zampini MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format 1511d975228cSstefano_zampini 1512c3339decSBarry Smith Collective 1513d975228cSstefano_zampini 1514d975228cSstefano_zampini Input Parameters: 1515d975228cSstefano_zampini + A - the matrix 1516d975228cSstefano_zampini . dnz - number of nonzeros per row in DIAGONAL portion of local submatrix 1517d975228cSstefano_zampini (same value is used for all local rows) 1518d975228cSstefano_zampini . dnnz - array containing the number of nonzeros in the various rows of the 1519d975228cSstefano_zampini DIAGONAL portion of the local submatrix (possibly different for each row) 15202ef1f0ffSBarry Smith or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `d_nz` is used to specify the nonzero structure. 15212ef1f0ffSBarry Smith The size of this array is equal to the number of local rows, i.e `m`. 1522d975228cSstefano_zampini For matrices that will be factored, you must leave room for (and set) 1523d975228cSstefano_zampini the diagonal entry even if it is zero. 1524d975228cSstefano_zampini . onz - number of nonzeros per row in the OFF-DIAGONAL portion of local 1525d975228cSstefano_zampini submatrix (same value is used for all local rows). 1526d975228cSstefano_zampini - onnz - array containing the number of nonzeros in the various rows of the 1527d975228cSstefano_zampini OFF-DIAGONAL portion of the local submatrix (possibly different for 15282ef1f0ffSBarry Smith each row) or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `o_nz` is used to specify the nonzero 1529d975228cSstefano_zampini structure. The size of this array is equal to the number 15302ef1f0ffSBarry Smith of local rows, i.e `m`. 1531d975228cSstefano_zampini 15322fe279fdSBarry Smith Level: intermediate 15332fe279fdSBarry Smith 153411a5261eSBarry Smith Note: 15352ef1f0ffSBarry Smith If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, `onz` and `onnz` are ignored. 1536d975228cSstefano_zampini 15372ef1f0ffSBarry Smith .seealso: [](chapter_matrices), `Mat`, `MatCreate()`, `MatMPIAIJSetPreallocation()`, `MATHYPRE`, `MATAIJ` 1538d975228cSstefano_zampini @*/ 1539d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1540d71ae5a4SJacob Faibussowitsch { 1541d975228cSstefano_zampini PetscFunctionBegin; 1542d975228cSstefano_zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1543d975228cSstefano_zampini PetscValidType(A, 1); 1544cac4c232SBarry Smith PetscTryMethod(A, "MatHYPRESetPreallocation_C", (Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[]), (A, dnz, dnnz, onz, onnz)); 15453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1546d975228cSstefano_zampini } 1547d975228cSstefano_zampini 154820f4b53cSBarry Smith /*@C 15492ef1f0ffSBarry Smith MatCreateFromParCSR - Creates a `Mat` from a `hypre_ParCSRMatrix` 1550225daaf8SStefano Zampini 1551225daaf8SStefano Zampini Collective 1552225daaf8SStefano Zampini 1553225daaf8SStefano Zampini Input Parameters: 15542ef1f0ffSBarry Smith + parcsr - the pointer to the `hypre_ParCSRMatrix` 15552ef1f0ffSBarry Smith . mtype - matrix type to be created. Currently `MATAIJ`, `MATIS` and `MATHYPRE` are supported. 155620f4b53cSBarry Smith - copymode - PETSc copying options, see `PetscCopyMode` 1557225daaf8SStefano Zampini 1558225daaf8SStefano Zampini Output Parameter: 1559225daaf8SStefano Zampini . A - the matrix 1560225daaf8SStefano Zampini 1561225daaf8SStefano Zampini Level: intermediate 1562225daaf8SStefano Zampini 15632ef1f0ffSBarry Smith .seealso: [](chapter_matrices), `Mat`, `MatHYPRE`, `PetscCopyMode` 156420f4b53cSBarry Smith @*/ 1565d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat *A) 1566d71ae5a4SJacob Faibussowitsch { 1567225daaf8SStefano Zampini Mat T; 1568978814f1SStefano Zampini Mat_HYPRE *hA; 1569978814f1SStefano Zampini MPI_Comm comm; 1570978814f1SStefano Zampini PetscInt rstart, rend, cstart, cend, M, N; 1571d248a85cSRichard Tran Mills PetscBool isseqaij, isseqaijmkl, ismpiaij, isaij, ishyp, isis; 1572978814f1SStefano Zampini 1573978814f1SStefano Zampini PetscFunctionBegin; 1574978814f1SStefano Zampini comm = hypre_ParCSRMatrixComm(parcsr); 15759566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATSEQAIJ, &isseqaij)); 15769566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATSEQAIJMKL, &isseqaijmkl)); 15779566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATMPIAIJ, &ismpiaij)); 15789566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij)); 15799566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATHYPRE, &ishyp)); 15809566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATIS, &isis)); 1581d248a85cSRichard Tran Mills isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij); 15826ea7df73SStefano Zampini /* TODO */ 1583aed4548fSBarry Smith PetscCheck(isaij || ishyp || isis, comm, PETSC_ERR_SUP, "Unsupported MatType %s! Supported types are %s, %s, %s, %s, %s, and %s", mtype, MATAIJ, MATSEQAIJ, MATSEQAIJMKL, MATMPIAIJ, MATIS, MATHYPRE); 1584978814f1SStefano Zampini /* access ParCSRMatrix */ 1585978814f1SStefano Zampini rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr); 1586978814f1SStefano Zampini rend = hypre_ParCSRMatrixLastRowIndex(parcsr); 1587978814f1SStefano Zampini cstart = hypre_ParCSRMatrixFirstColDiag(parcsr); 1588978814f1SStefano Zampini cend = hypre_ParCSRMatrixLastColDiag(parcsr); 1589978814f1SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(parcsr); 1590978814f1SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(parcsr); 1591978814f1SStefano Zampini 1592fa92c42cSstefano_zampini /* fix for empty local rows/columns */ 1593fa92c42cSstefano_zampini if (rend < rstart) rend = rstart; 1594fa92c42cSstefano_zampini if (cend < cstart) cend = cstart; 1595fa92c42cSstefano_zampini 1596e6471dc9SStefano Zampini /* PETSc convention */ 1597e6471dc9SStefano Zampini rend++; 1598e6471dc9SStefano Zampini cend++; 1599e6471dc9SStefano Zampini rend = PetscMin(rend, M); 1600e6471dc9SStefano Zampini cend = PetscMin(cend, N); 1601e6471dc9SStefano Zampini 1602978814f1SStefano Zampini /* create PETSc matrix with MatHYPRE */ 16039566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &T)); 16049566063dSJacob Faibussowitsch PetscCall(MatSetSizes(T, rend - rstart, cend - cstart, M, N)); 16059566063dSJacob Faibussowitsch PetscCall(MatSetType(T, MATHYPRE)); 1606225daaf8SStefano Zampini hA = (Mat_HYPRE *)(T->data); 1607978814f1SStefano Zampini 1608978814f1SStefano Zampini /* create HYPRE_IJMatrix */ 1609792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate, hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij); 1610792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType, hA->ij, HYPRE_PARCSR); 161145b8d346SStefano Zampini 16126ea7df73SStefano Zampini // TODO DEV 161345b8d346SStefano Zampini /* create new ParCSR object if needed */ 161445b8d346SStefano Zampini if (ishyp && copymode == PETSC_COPY_VALUES) { 161545b8d346SStefano Zampini hypre_ParCSRMatrix *new_parcsr; 16166ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0) 161745b8d346SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd, *ndiag, *noffd; 161845b8d346SStefano Zampini 16190e6427aaSSatish Balay new_parcsr = hypre_ParCSRMatrixClone(parcsr, 0); 162045b8d346SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 162145b8d346SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 162245b8d346SStefano Zampini ndiag = hypre_ParCSRMatrixDiag(new_parcsr); 162345b8d346SStefano Zampini noffd = hypre_ParCSRMatrixOffd(new_parcsr); 16249566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(ndiag), hypre_CSRMatrixData(hdiag), hypre_CSRMatrixNumNonzeros(hdiag))); 16259566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(noffd), hypre_CSRMatrixData(hoffd), hypre_CSRMatrixNumNonzeros(hoffd))); 16266ea7df73SStefano Zampini #else 16276ea7df73SStefano Zampini new_parcsr = hypre_ParCSRMatrixClone(parcsr, 1); 16286ea7df73SStefano Zampini #endif 162945b8d346SStefano Zampini parcsr = new_parcsr; 163045b8d346SStefano Zampini copymode = PETSC_OWN_POINTER; 163145b8d346SStefano Zampini } 1632978814f1SStefano Zampini 1633978814f1SStefano Zampini /* set ParCSR object */ 1634978814f1SStefano Zampini hypre_IJMatrixObject(hA->ij) = parcsr; 16354ec6421dSstefano_zampini T->preallocated = PETSC_TRUE; 1636978814f1SStefano Zampini 1637978814f1SStefano Zampini /* set assembled flag */ 1638978814f1SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 1; 16396ea7df73SStefano Zampini #if 0 1640792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize,hA->ij); 16416ea7df73SStefano Zampini #endif 1642225daaf8SStefano Zampini if (ishyp) { 16436d2a658fSstefano_zampini PetscMPIInt myid = 0; 16446d2a658fSstefano_zampini 16456d2a658fSstefano_zampini /* make sure we always have row_starts and col_starts available */ 164648a46eb9SPierre Jolivet if (HYPRE_AssumedPartitionCheck()) PetscCallMPI(MPI_Comm_rank(comm, &myid)); 1647a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 16486d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) { 16496d2a658fSstefano_zampini PetscLayout map; 16506d2a658fSstefano_zampini 16519566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T, NULL, &map)); 16529566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 16532cf14000SStefano Zampini hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid); 16546d2a658fSstefano_zampini } 16556d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) { 16566d2a658fSstefano_zampini PetscLayout map; 16576d2a658fSstefano_zampini 16589566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T, &map, NULL)); 16599566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 16602cf14000SStefano Zampini hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid); 16616d2a658fSstefano_zampini } 1662a1d2239cSSatish Balay #endif 1663978814f1SStefano Zampini /* prevent from freeing the pointer */ 1664978814f1SStefano Zampini if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE; 1665225daaf8SStefano Zampini *A = T; 16669566063dSJacob Faibussowitsch PetscCall(MatSetOption(*A, MAT_SORTED_FULL, PETSC_TRUE)); 16679566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*A, MAT_FINAL_ASSEMBLY)); 16689566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*A, MAT_FINAL_ASSEMBLY)); 1669bb4689ddSStefano Zampini } else if (isaij) { 1670bb4689ddSStefano Zampini if (copymode != PETSC_OWN_POINTER) { 1671225daaf8SStefano Zampini /* prevent from freeing the pointer */ 1672225daaf8SStefano Zampini hA->inner_free = PETSC_FALSE; 16739566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INITIAL_MATRIX, A)); 16749566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T)); 1675225daaf8SStefano Zampini } else { /* AIJ return type with PETSC_OWN_POINTER */ 16769566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INPLACE_MATRIX, &T)); 1677225daaf8SStefano Zampini *A = T; 1678225daaf8SStefano Zampini } 1679bb4689ddSStefano Zampini } else if (isis) { 16809566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_IS(T, MATIS, MAT_INITIAL_MATRIX, A)); 16818cfe8d00SStefano Zampini if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE; 16829566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T)); 1683bb4689ddSStefano Zampini } 16843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1685978814f1SStefano Zampini } 1686978814f1SStefano Zampini 1687d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr) 1688d71ae5a4SJacob Faibussowitsch { 1689dd9c0a25Sstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1690dd9c0a25Sstefano_zampini HYPRE_Int type; 1691dd9c0a25Sstefano_zampini 1692dd9c0a25Sstefano_zampini PetscFunctionBegin; 169328b400f6SJacob Faibussowitsch PetscCheck(hA->ij, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE_IJMatrix not present"); 1694792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType, hA->ij, &type); 169508401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "HYPRE_IJMatrix is not of type HYPRE_PARCSR"); 1696792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject, hA->ij, (void **)parcsr); 16973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1698dd9c0a25Sstefano_zampini } 1699dd9c0a25Sstefano_zampini 170020f4b53cSBarry Smith /*@C 1701dd9c0a25Sstefano_zampini MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix 1702dd9c0a25Sstefano_zampini 17032ef1f0ffSBarry Smith Not Collective 1704dd9c0a25Sstefano_zampini 170520f4b53cSBarry Smith Input Parameter: 170620f4b53cSBarry Smith . A - the `MATHYPRE` object 1707dd9c0a25Sstefano_zampini 1708dd9c0a25Sstefano_zampini Output Parameter: 17092ef1f0ffSBarry Smith . parcsr - the pointer to the `hypre_ParCSRMatrix` 1710dd9c0a25Sstefano_zampini 1711dd9c0a25Sstefano_zampini Level: intermediate 1712dd9c0a25Sstefano_zampini 17132ef1f0ffSBarry Smith .seealso: [](chapter_matrices), `Mat`, `MatHYPRE`, `PetscCopyMode` 171420f4b53cSBarry Smith @*/ 1715d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr) 1716d71ae5a4SJacob Faibussowitsch { 1717dd9c0a25Sstefano_zampini PetscFunctionBegin; 1718dd9c0a25Sstefano_zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1719dd9c0a25Sstefano_zampini PetscValidType(A, 1); 1720cac4c232SBarry Smith PetscUseMethod(A, "MatHYPREGetParCSR_C", (Mat, hypre_ParCSRMatrix **), (A, parcsr)); 17213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1722dd9c0a25Sstefano_zampini } 1723dd9c0a25Sstefano_zampini 1724d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_HYPRE(Mat A, PetscBool *missing, PetscInt *dd) 1725d71ae5a4SJacob Faibussowitsch { 172668ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 172768ec7858SStefano Zampini hypre_CSRMatrix *ha; 172868ec7858SStefano Zampini PetscInt rst; 172968ec7858SStefano Zampini 173068ec7858SStefano Zampini PetscFunctionBegin; 173108401ef6SPierre Jolivet PetscCheck(A->rmap->n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_SUP, "Not implemented with non-square diagonal blocks"); 17329566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, NULL)); 17339566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 173468ec7858SStefano Zampini if (missing) *missing = PETSC_FALSE; 173568ec7858SStefano Zampini if (dd) *dd = -1; 173668ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 173768ec7858SStefano Zampini if (ha) { 173868299464SStefano Zampini PetscInt size, i; 173968299464SStefano Zampini HYPRE_Int *ii, *jj; 174068ec7858SStefano Zampini 174168ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 174268ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 174368ec7858SStefano Zampini jj = hypre_CSRMatrixJ(ha); 174468ec7858SStefano Zampini for (i = 0; i < size; i++) { 174568ec7858SStefano Zampini PetscInt j; 174668ec7858SStefano Zampini PetscBool found = PETSC_FALSE; 174768ec7858SStefano Zampini 17489371c9d4SSatish Balay for (j = ii[i]; j < ii[i + 1] && !found; j++) found = (jj[j] == i) ? PETSC_TRUE : PETSC_FALSE; 174968ec7858SStefano Zampini 175068ec7858SStefano Zampini if (!found) { 17513ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing local diagonal entry %" PetscInt_FMT "\n", i)); 175268ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 175368ec7858SStefano Zampini if (dd) *dd = i + rst; 17543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 175568ec7858SStefano Zampini } 175668ec7858SStefano Zampini } 175768ec7858SStefano Zampini if (!size) { 17583ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n")); 175968ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 176068ec7858SStefano Zampini if (dd) *dd = rst; 176168ec7858SStefano Zampini } 176268ec7858SStefano Zampini } else { 17633ba16761SJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no diagonal entries therefore is missing diagonal\n")); 176468ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 176568ec7858SStefano Zampini if (dd) *dd = rst; 176668ec7858SStefano Zampini } 17673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 176868ec7858SStefano Zampini } 176968ec7858SStefano Zampini 1770d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s) 1771d71ae5a4SJacob Faibussowitsch { 177268ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 17736ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0) 177468ec7858SStefano Zampini hypre_CSRMatrix *ha; 17756ea7df73SStefano Zampini #endif 177639accc25SStefano Zampini HYPRE_Complex hs; 177768ec7858SStefano Zampini 177868ec7858SStefano Zampini PetscFunctionBegin; 17799566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(s, &hs)); 17809566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 17816ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 19, 0) 1782792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixScale, parcsr, hs); 17836ea7df73SStefano Zampini #else /* diagonal part */ 178468ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 178568ec7858SStefano Zampini if (ha) { 178668299464SStefano Zampini PetscInt size, i; 178768299464SStefano Zampini HYPRE_Int *ii; 178839accc25SStefano Zampini HYPRE_Complex *a; 178968ec7858SStefano Zampini 179068ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 179168ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 179268ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 179339accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 179468ec7858SStefano Zampini } 179568ec7858SStefano Zampini /* offdiagonal part */ 179668ec7858SStefano Zampini ha = hypre_ParCSRMatrixOffd(parcsr); 179768ec7858SStefano Zampini if (ha) { 179868299464SStefano Zampini PetscInt size, i; 179968299464SStefano Zampini HYPRE_Int *ii; 180039accc25SStefano Zampini HYPRE_Complex *a; 180168ec7858SStefano Zampini 180268ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 180368ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 180468ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 180539accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 180668ec7858SStefano Zampini } 18076ea7df73SStefano Zampini #endif 18083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 180968ec7858SStefano Zampini } 181068ec7858SStefano Zampini 1811d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 1812d71ae5a4SJacob Faibussowitsch { 181368ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 181468299464SStefano Zampini HYPRE_Int *lrows; 181568299464SStefano Zampini PetscInt rst, ren, i; 181668ec7858SStefano Zampini 181768ec7858SStefano Zampini PetscFunctionBegin; 181808401ef6SPierre Jolivet PetscCheck(!x && !b, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "To be implemented"); 18199566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 18209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numRows, &lrows)); 18219566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, &ren)); 182268ec7858SStefano Zampini for (i = 0; i < numRows; i++) { 18237a46b595SBarry Smith PetscCheck(rows[i] >= rst && rows[i] < ren, PETSC_COMM_SELF, PETSC_ERR_SUP, "Non-local rows not yet supported"); 182468ec7858SStefano Zampini lrows[i] = rows[i] - rst; 182568ec7858SStefano Zampini } 1826792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixEliminateRowsCols, parcsr, numRows, lrows); 18279566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows)); 18283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 182968ec7858SStefano Zampini } 183068ec7858SStefano Zampini 1831d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha) 1832d71ae5a4SJacob Faibussowitsch { 1833c69f721fSFande Kong PetscFunctionBegin; 1834c69f721fSFande Kong if (ha) { 1835c69f721fSFande Kong HYPRE_Int *ii, size; 1836c69f721fSFande Kong HYPRE_Complex *a; 1837c69f721fSFande Kong 1838c69f721fSFande Kong size = hypre_CSRMatrixNumRows(ha); 1839c69f721fSFande Kong a = hypre_CSRMatrixData(ha); 1840c69f721fSFande Kong ii = hypre_CSRMatrixI(ha); 1841c69f721fSFande Kong 18429566063dSJacob Faibussowitsch if (a) PetscCall(PetscArrayzero(a, ii[size])); 1843c69f721fSFande Kong } 18443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1845c69f721fSFande Kong } 1846c69f721fSFande Kong 1847d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_HYPRE(Mat A) 1848d71ae5a4SJacob Faibussowitsch { 18496ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 18506ea7df73SStefano Zampini 18516ea7df73SStefano Zampini PetscFunctionBegin; 18526ea7df73SStefano Zampini if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) { 1853792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetConstantValues, hA->ij, 0.0); 18546ea7df73SStefano Zampini } else { 1855c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 1856c69f721fSFande Kong 18579566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 18589566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr))); 18599566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr))); 18606ea7df73SStefano Zampini } 18613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1862c69f721fSFande Kong } 1863c69f721fSFande Kong 1864d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA, PetscInt N, const PetscInt rows[], HYPRE_Complex diag) 1865d71ae5a4SJacob Faibussowitsch { 186639accc25SStefano Zampini PetscInt ii; 186739accc25SStefano Zampini HYPRE_Int *i, *j; 186839accc25SStefano Zampini HYPRE_Complex *a; 1869c69f721fSFande Kong 1870c69f721fSFande Kong PetscFunctionBegin; 18713ba16761SJacob Faibussowitsch if (!hA) PetscFunctionReturn(PETSC_SUCCESS); 1872c69f721fSFande Kong 187339accc25SStefano Zampini i = hypre_CSRMatrixI(hA); 187439accc25SStefano Zampini j = hypre_CSRMatrixJ(hA); 1875c69f721fSFande Kong a = hypre_CSRMatrixData(hA); 1876c69f721fSFande Kong 1877c69f721fSFande Kong for (ii = 0; ii < N; ii++) { 187839accc25SStefano Zampini HYPRE_Int jj, ibeg, iend, irow; 187939accc25SStefano Zampini 1880c69f721fSFande Kong irow = rows[ii]; 1881c69f721fSFande Kong ibeg = i[irow]; 1882c69f721fSFande Kong iend = i[irow + 1]; 1883c69f721fSFande Kong for (jj = ibeg; jj < iend; jj++) 1884c69f721fSFande Kong if (j[jj] == irow) a[jj] = diag; 1885c69f721fSFande Kong else a[jj] = 0.0; 1886c69f721fSFande Kong } 18873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1888c69f721fSFande Kong } 1889c69f721fSFande Kong 1890d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 1891d71ae5a4SJacob Faibussowitsch { 1892c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 1893c69f721fSFande Kong PetscInt *lrows, len; 189439accc25SStefano Zampini HYPRE_Complex hdiag; 1895c69f721fSFande Kong 1896c69f721fSFande Kong PetscFunctionBegin; 189708401ef6SPierre Jolivet PetscCheck(!x && !b, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size"); 18989566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(diag, &hdiag)); 1899c69f721fSFande Kong /* retrieve the internal matrix */ 19009566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 1901c69f721fSFande Kong /* get locally owned rows */ 19029566063dSJacob Faibussowitsch PetscCall(MatZeroRowsMapLocal_Private(A, N, rows, &len, &lrows)); 1903c69f721fSFande Kong /* zero diagonal part */ 19049566063dSJacob Faibussowitsch PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr), len, lrows, hdiag)); 1905c69f721fSFande Kong /* zero off-diagonal part */ 19069566063dSJacob Faibussowitsch PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr), len, lrows, 0.0)); 1907c69f721fSFande Kong 19089566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows)); 19093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1910c69f721fSFande Kong } 1911c69f721fSFande Kong 1912d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat, MatAssemblyType mode) 1913d71ae5a4SJacob Faibussowitsch { 1914c69f721fSFande Kong PetscFunctionBegin; 19153ba16761SJacob Faibussowitsch if (mat->nooffprocentries) PetscFunctionReturn(PETSC_SUCCESS); 1916c69f721fSFande Kong 19179566063dSJacob Faibussowitsch PetscCall(MatStashScatterBegin_Private(mat, &mat->stash, mat->rmap->range)); 19183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1919c69f721fSFande Kong } 1920c69f721fSFande Kong 1921d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 1922d71ae5a4SJacob Faibussowitsch { 1923c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 19242cf14000SStefano Zampini HYPRE_Int hnz; 1925c69f721fSFande Kong 1926c69f721fSFande Kong PetscFunctionBegin; 1927c69f721fSFande Kong /* retrieve the internal matrix */ 19289566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 1929c69f721fSFande Kong /* call HYPRE API */ 1930792fecdfSBarry Smith PetscCallExternal(HYPRE_ParCSRMatrixGetRow, parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v); 19312cf14000SStefano Zampini if (nz) *nz = (PetscInt)hnz; 19323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1933c69f721fSFande Kong } 1934c69f721fSFande Kong 1935d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 1936d71ae5a4SJacob Faibussowitsch { 1937c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 19382cf14000SStefano Zampini HYPRE_Int hnz; 1939c69f721fSFande Kong 1940c69f721fSFande Kong PetscFunctionBegin; 1941c69f721fSFande Kong /* retrieve the internal matrix */ 19429566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 1943c69f721fSFande Kong /* call HYPRE API */ 19442cf14000SStefano Zampini hnz = nz ? (HYPRE_Int)(*nz) : 0; 1945792fecdfSBarry Smith PetscCallExternal(HYPRE_ParCSRMatrixRestoreRow, parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v); 19463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1947c69f721fSFande Kong } 1948c69f721fSFande Kong 1949d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetValues_HYPRE(Mat A, PetscInt m, const PetscInt idxm[], PetscInt n, const PetscInt idxn[], PetscScalar v[]) 1950d71ae5a4SJacob Faibussowitsch { 195145b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1952c69f721fSFande Kong PetscInt i; 19531d4906efSStefano Zampini 1954c69f721fSFande Kong PetscFunctionBegin; 19553ba16761SJacob Faibussowitsch if (!m || !n) PetscFunctionReturn(PETSC_SUCCESS); 1956c69f721fSFande Kong /* Ignore negative row indices 1957c69f721fSFande Kong * And negative column indices should be automatically ignored in hypre 1958c69f721fSFande Kong * */ 19592cf14000SStefano Zampini for (i = 0; i < m; i++) { 19602cf14000SStefano Zampini if (idxm[i] >= 0) { 19612cf14000SStefano Zampini HYPRE_Int hn = (HYPRE_Int)n; 1962792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetValues, hA->ij, 1, &hn, (HYPRE_BigInt *)&idxm[i], (HYPRE_BigInt *)idxn, (HYPRE_Complex *)(v + i * n)); 19632cf14000SStefano Zampini } 19642cf14000SStefano Zampini } 19653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1966c69f721fSFande Kong } 1967c69f721fSFande Kong 1968d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetOption_HYPRE(Mat A, MatOption op, PetscBool flg) 1969d71ae5a4SJacob Faibussowitsch { 1970ddbeb582SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 1971ddbeb582SStefano Zampini 1972ddbeb582SStefano Zampini PetscFunctionBegin; 1973c6698e78SStefano Zampini switch (op) { 1974ddbeb582SStefano Zampini case MAT_NO_OFF_PROC_ENTRIES: 197548a46eb9SPierre Jolivet if (flg) PetscCallExternal(HYPRE_IJMatrixSetMaxOffProcElmts, hA->ij, 0); 1976ddbeb582SStefano Zampini break; 1977d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 1978d71ae5a4SJacob Faibussowitsch hA->sorted_full = flg; 1979d71ae5a4SJacob Faibussowitsch break; 1980d71ae5a4SJacob Faibussowitsch default: 1981d71ae5a4SJacob Faibussowitsch break; 1982ddbeb582SStefano Zampini } 19833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1984ddbeb582SStefano Zampini } 1985c69f721fSFande Kong 1986d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view) 1987d71ae5a4SJacob Faibussowitsch { 198845b8d346SStefano Zampini PetscViewerFormat format; 198945b8d346SStefano Zampini 199045b8d346SStefano Zampini PetscFunctionBegin; 19919566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(view, &format)); 19923ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 199345b8d346SStefano Zampini if (format != PETSC_VIEWER_NATIVE) { 19946ea7df73SStefano Zampini Mat B; 19956ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 19966ea7df73SStefano Zampini PetscErrorCode (*mview)(Mat, PetscViewer) = NULL; 19976ea7df73SStefano Zampini 19989566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 19999566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(parcsr, MATAIJ, PETSC_USE_POINTER, &B)); 20009566063dSJacob Faibussowitsch PetscCall(MatGetOperation(B, MATOP_VIEW, (void (**)(void)) & mview)); 200128b400f6SJacob Faibussowitsch PetscCheck(mview, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Missing view operation"); 20029566063dSJacob Faibussowitsch PetscCall((*mview)(B, view)); 20039566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 200445b8d346SStefano Zampini } else { 200545b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data; 200645b8d346SStefano Zampini PetscMPIInt size; 200745b8d346SStefano Zampini PetscBool isascii; 200845b8d346SStefano Zampini const char *filename; 200945b8d346SStefano Zampini 201045b8d346SStefano Zampini /* HYPRE uses only text files */ 20119566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)view, PETSCVIEWERASCII, &isascii)); 201228b400f6SJacob Faibussowitsch PetscCheck(isascii, PetscObjectComm((PetscObject)view), PETSC_ERR_SUP, "PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII", ((PetscObject)view)->type_name); 20139566063dSJacob Faibussowitsch PetscCall(PetscViewerFileGetName(view, &filename)); 2014792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixPrint, hA->ij, filename); 20159566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(hA->comm, &size)); 201645b8d346SStefano Zampini if (size > 1) { 20179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view, "Matrix files: %s.%05d ... %s.%05d\n", filename, 0, filename, size - 1)); 201845b8d346SStefano Zampini } else { 20199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view, "Matrix file: %s.%05d\n", filename, 0)); 202045b8d346SStefano Zampini } 202145b8d346SStefano Zampini } 20223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202345b8d346SStefano Zampini } 202445b8d346SStefano Zampini 2025d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str) 2026d71ae5a4SJacob Faibussowitsch { 2027465edc17SStefano Zampini hypre_ParCSRMatrix *acsr, *bcsr; 2028465edc17SStefano Zampini 2029465edc17SStefano Zampini PetscFunctionBegin; 2030465edc17SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 20319566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &acsr)); 20329566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(B, &bcsr)); 2033792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixCopy, acsr, bcsr, 1); 20349566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 20359566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 20369566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 2037465edc17SStefano Zampini } else { 20389566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2039465edc17SStefano Zampini } 20403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2041465edc17SStefano Zampini } 2042465edc17SStefano Zampini 2043d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d) 2044d71ae5a4SJacob Faibussowitsch { 20456305df00SStefano Zampini hypre_ParCSRMatrix *parcsr; 20466305df00SStefano Zampini hypre_CSRMatrix *dmat; 204739accc25SStefano Zampini HYPRE_Complex *a; 204839accc25SStefano Zampini HYPRE_Complex *data = NULL; 20492cf14000SStefano Zampini HYPRE_Int *diag = NULL; 20502cf14000SStefano Zampini PetscInt i; 20516305df00SStefano Zampini PetscBool cong; 20526305df00SStefano Zampini 20536305df00SStefano Zampini PetscFunctionBegin; 20549566063dSJacob Faibussowitsch PetscCall(MatHasCongruentLayouts(A, &cong)); 205528b400f6SJacob Faibussowitsch PetscCheck(cong, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only for square matrices with same local distributions of rows and columns"); 205676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 20576305df00SStefano Zampini PetscBool miss; 20589566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal(A, &miss, NULL)); 205908401ef6SPierre Jolivet PetscCheck(!miss || !A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_SUP, "Not implemented when diagonal entries are missing"); 20606305df00SStefano Zampini } 20619566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 20626305df00SStefano Zampini dmat = hypre_ParCSRMatrixDiag(parcsr); 20636305df00SStefano Zampini if (dmat) { 206439accc25SStefano Zampini /* this cast fixes the clang error: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 20659566063dSJacob Faibussowitsch PetscCall(VecGetArray(d, (PetscScalar **)&a)); 20662cf14000SStefano Zampini diag = hypre_CSRMatrixI(dmat); 206739accc25SStefano Zampini data = hypre_CSRMatrixData(dmat); 20686305df00SStefano Zampini for (i = 0; i < A->rmap->n; i++) a[i] = data[diag[i]]; 20699566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(d, (PetscScalar **)&a)); 20706305df00SStefano Zampini } 20713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20726305df00SStefano Zampini } 20736305df00SStefano Zampini 2074363d496dSStefano Zampini #include <petscblaslapack.h> 2075363d496dSStefano Zampini 2076d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAXPY_HYPRE(Mat Y, PetscScalar a, Mat X, MatStructure str) 2077d71ae5a4SJacob Faibussowitsch { 2078363d496dSStefano Zampini PetscFunctionBegin; 20796ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 20806ea7df73SStefano Zampini { 20816ea7df73SStefano Zampini Mat B; 20826ea7df73SStefano Zampini hypre_ParCSRMatrix *x, *y, *z; 20836ea7df73SStefano Zampini 20849566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y, &y)); 20859566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X, &x)); 2086792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixAdd, 1.0, y, 1.0, x, &z); 20879566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(z, MATHYPRE, PETSC_OWN_POINTER, &B)); 20889566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 20896ea7df73SStefano Zampini } 20906ea7df73SStefano Zampini #else 2091363d496dSStefano Zampini if (str == SAME_NONZERO_PATTERN) { 2092363d496dSStefano Zampini hypre_ParCSRMatrix *x, *y; 2093363d496dSStefano Zampini hypre_CSRMatrix *xloc, *yloc; 2094363d496dSStefano Zampini PetscInt xnnz, ynnz; 209539accc25SStefano Zampini HYPRE_Complex *xarr, *yarr; 2096363d496dSStefano Zampini PetscBLASInt one = 1, bnz; 2097363d496dSStefano Zampini 20989566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y, &y)); 20999566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X, &x)); 2100363d496dSStefano Zampini 2101363d496dSStefano Zampini /* diagonal block */ 2102363d496dSStefano Zampini xloc = hypre_ParCSRMatrixDiag(x); 2103363d496dSStefano Zampini yloc = hypre_ParCSRMatrixDiag(y); 2104363d496dSStefano Zampini xnnz = 0; 2105363d496dSStefano Zampini ynnz = 0; 2106363d496dSStefano Zampini xarr = NULL; 2107363d496dSStefano Zampini yarr = NULL; 2108363d496dSStefano Zampini if (xloc) { 210939accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2110363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2111363d496dSStefano Zampini } 2112363d496dSStefano Zampini if (yloc) { 211339accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2114363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2115363d496dSStefano Zampini } 211608401ef6SPierre Jolivet PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz); 21179566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz, &bnz)); 2118792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one)); 2119363d496dSStefano Zampini 2120363d496dSStefano Zampini /* off-diagonal block */ 2121363d496dSStefano Zampini xloc = hypre_ParCSRMatrixOffd(x); 2122363d496dSStefano Zampini yloc = hypre_ParCSRMatrixOffd(y); 2123363d496dSStefano Zampini xnnz = 0; 2124363d496dSStefano Zampini ynnz = 0; 2125363d496dSStefano Zampini xarr = NULL; 2126363d496dSStefano Zampini yarr = NULL; 2127363d496dSStefano Zampini if (xloc) { 212839accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2129363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2130363d496dSStefano Zampini } 2131363d496dSStefano Zampini if (yloc) { 213239accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2133363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2134363d496dSStefano Zampini } 213508401ef6SPierre Jolivet PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz); 21369566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz, &bnz)); 2137792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one)); 2138363d496dSStefano Zampini } else if (str == SUBSET_NONZERO_PATTERN) { 21399566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 2140363d496dSStefano Zampini } else { 2141363d496dSStefano Zampini Mat B; 2142363d496dSStefano Zampini 21439566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic_Preallocate(Y, X, &B)); 21449566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 21459566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(Y, &B)); 2146363d496dSStefano Zampini } 21476ea7df73SStefano Zampini #endif 21483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2149363d496dSStefano Zampini } 2150363d496dSStefano Zampini 21512c4ab24aSJunchao Zhang /* Attach cooMat to hypre matrix mat. The two matrices will share the same data array */ 21522c4ab24aSJunchao Zhang static PetscErrorCode MatAttachCOOMat_HYPRE(Mat mat, Mat cooMat) 21532c4ab24aSJunchao Zhang { 21542c4ab24aSJunchao Zhang Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data; 21552c4ab24aSJunchao Zhang hypre_CSRMatrix *diag, *offd; 21562c4ab24aSJunchao Zhang hypre_ParCSRMatrix *parCSR; 21572c4ab24aSJunchao Zhang HYPRE_MemoryLocation hypreMemtype = HYPRE_MEMORY_HOST; 21582c4ab24aSJunchao Zhang PetscMemType petscMemtype; 21592c4ab24aSJunchao Zhang Mat A, B; 21602c4ab24aSJunchao Zhang PetscScalar *Aa, *Ba; 21612c4ab24aSJunchao Zhang PetscMPIInt size; 21622c4ab24aSJunchao Zhang MPI_Comm comm; 21632c4ab24aSJunchao Zhang PetscLayout rmap; 21642c4ab24aSJunchao Zhang 21652c4ab24aSJunchao Zhang PetscFunctionBegin; 21662c4ab24aSJunchao Zhang PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 21672c4ab24aSJunchao Zhang PetscCallMPI(MPI_Comm_size(comm, &size)); 21682c4ab24aSJunchao Zhang PetscCall(MatGetLayouts(mat, &rmap, NULL)); 21692c4ab24aSJunchao Zhang 21702c4ab24aSJunchao Zhang /* Alias cooMat's data array to IJMatrix's */ 21712c4ab24aSJunchao Zhang PetscCallExternal(HYPRE_IJMatrixGetObject, hmat->ij, (void **)&parCSR); 21722c4ab24aSJunchao Zhang diag = hypre_ParCSRMatrixDiag(parCSR); 21732c4ab24aSJunchao Zhang offd = hypre_ParCSRMatrixOffd(parCSR); 21742c4ab24aSJunchao Zhang 21752c4ab24aSJunchao Zhang hypreMemtype = hypre_CSRMatrixMemoryLocation(diag); 21762c4ab24aSJunchao Zhang A = (size == 1) ? cooMat : ((Mat_MPIAIJ *)cooMat->data)->A; 21772c4ab24aSJunchao Zhang PetscCall(MatSeqAIJGetCSRAndMemType(A, NULL, NULL, &Aa, &petscMemtype)); 21782c4ab24aSJunchao Zhang PetscAssert((PetscMemTypeHost(petscMemtype) && hypreMemtype == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(petscMemtype) && hypreMemtype == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch"); 21792c4ab24aSJunchao Zhang 21802c4ab24aSJunchao Zhang hmat->diagJ = hypre_CSRMatrixJ(diag); 21812c4ab24aSJunchao Zhang PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(diag), hypreMemtype)); 21822c4ab24aSJunchao Zhang hypre_CSRMatrixData(diag) = (HYPRE_Complex *)Aa; 21832c4ab24aSJunchao Zhang hypre_CSRMatrixOwnsData(diag) = 0; /* Take ownership of (j,a) away from hypre. As a result, we need to free them on our own */ 21842c4ab24aSJunchao Zhang 21852c4ab24aSJunchao Zhang /* Copy diagonal pointers of A to device to facilitate MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos */ 21862c4ab24aSJunchao Zhang if (hypreMemtype == HYPRE_MEMORY_DEVICE) { 21872c4ab24aSJunchao Zhang PetscStackCallExternalVoid("hypre_TAlloc", hmat->diag = hypre_TAlloc(PetscInt, rmap->n, hypreMemtype)); 21882c4ab24aSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); /* We need updated diagonal positions */ 21892c4ab24aSJunchao Zhang PetscStackCallExternalVoid("hypre_TMemcpy", hypre_TMemcpy(hmat->diag, ((Mat_SeqAIJ *)A->data)->diag, PetscInt, rmap->n, hypreMemtype, HYPRE_MEMORY_HOST)); 21902c4ab24aSJunchao Zhang } 21912c4ab24aSJunchao Zhang 21922c4ab24aSJunchao Zhang if (size > 1) { 21932c4ab24aSJunchao Zhang B = ((Mat_MPIAIJ *)cooMat->data)->B; 21942c4ab24aSJunchao Zhang PetscCall(MatSeqAIJGetCSRAndMemType(B, NULL, NULL, &Ba, &petscMemtype)); 21952c4ab24aSJunchao Zhang hmat->offdJ = hypre_CSRMatrixJ(offd); 21962c4ab24aSJunchao Zhang PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(offd), hypreMemtype)); 21972c4ab24aSJunchao Zhang hypre_CSRMatrixData(offd) = (HYPRE_Complex *)Ba; 21982c4ab24aSJunchao Zhang hypre_CSRMatrixOwnsData(offd) = 0; 21992c4ab24aSJunchao Zhang } 22002c4ab24aSJunchao Zhang 22012c4ab24aSJunchao Zhang /* Record cooMat for use in MatSetValuesCOO_HYPRE */ 22022c4ab24aSJunchao Zhang hmat->cooMat = cooMat; 22032c4ab24aSJunchao Zhang hmat->memType = hypreMemtype; 22042c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 22052c4ab24aSJunchao Zhang } 22062c4ab24aSJunchao Zhang 22072c4ab24aSJunchao Zhang static PetscErrorCode MatDuplicate_HYPRE(Mat A, MatDuplicateOption op, Mat *B) 22082c4ab24aSJunchao Zhang { 22092c4ab24aSJunchao Zhang hypre_ParCSRMatrix *parcsr = NULL; 22102c4ab24aSJunchao Zhang PetscCopyMode cpmode; 22112c4ab24aSJunchao Zhang Mat_HYPRE *hA; 22122c4ab24aSJunchao Zhang Mat cooMat; 22132c4ab24aSJunchao Zhang 22142c4ab24aSJunchao Zhang PetscFunctionBegin; 22152c4ab24aSJunchao Zhang PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr)); 22162c4ab24aSJunchao Zhang if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) { 22172c4ab24aSJunchao Zhang parcsr = hypre_ParCSRMatrixClone(parcsr, 0); 22182c4ab24aSJunchao Zhang cpmode = PETSC_OWN_POINTER; 22192c4ab24aSJunchao Zhang } else { 22202c4ab24aSJunchao Zhang cpmode = PETSC_COPY_VALUES; 22212c4ab24aSJunchao Zhang } 22222c4ab24aSJunchao Zhang PetscCall(MatCreateFromParCSR(parcsr, MATHYPRE, cpmode, B)); 22232c4ab24aSJunchao Zhang hA = (Mat_HYPRE *)A->data; 22242c4ab24aSJunchao Zhang if (hA->cooMat) { 22252c4ab24aSJunchao Zhang /* could not simply increase the reference count of hA->cooMat, since B needs to share cooMat's data array */ 22262c4ab24aSJunchao Zhang PetscCall(MatDuplicate(hA->cooMat, MAT_DO_NOT_COPY_VALUES, &cooMat)); 22272c4ab24aSJunchao Zhang PetscCall(MatAttachCOOMat_HYPRE(*B, cooMat)); 22282c4ab24aSJunchao Zhang } 22292c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 22302c4ab24aSJunchao Zhang } 22312c4ab24aSJunchao Zhang 2232d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetPreallocationCOO_HYPRE(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 2233d71ae5a4SJacob Faibussowitsch { 22345fbaff96SJunchao Zhang MPI_Comm comm; 22355fbaff96SJunchao Zhang PetscMPIInt size; 22365fbaff96SJunchao Zhang PetscLayout rmap, cmap; 22375fbaff96SJunchao Zhang Mat_HYPRE *hmat; 22382c4ab24aSJunchao Zhang Mat cooMat; 22395fbaff96SJunchao Zhang MatType matType = MATAIJ; /* default type of cooMat */ 22405fbaff96SJunchao Zhang 22415fbaff96SJunchao Zhang PetscFunctionBegin; 22425fbaff96SJunchao Zhang /* Build an agent matrix cooMat whose type is either MATAIJ or MATAIJKOKKOS. 22435fbaff96SJunchao Zhang It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work. 22445fbaff96SJunchao Zhang */ 22455fbaff96SJunchao Zhang PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 22465fbaff96SJunchao Zhang PetscCallMPI(MPI_Comm_size(comm, &size)); 22475fbaff96SJunchao Zhang PetscCall(PetscLayoutSetUp(mat->rmap)); 22485fbaff96SJunchao Zhang PetscCall(PetscLayoutSetUp(mat->cmap)); 22495fbaff96SJunchao Zhang PetscCall(MatGetLayouts(mat, &rmap, &cmap)); 22505fbaff96SJunchao Zhang 22515fbaff96SJunchao Zhang /* I do not know how hypre_ParCSRMatrix stores diagonal elements for non-square matrices, so I just give up now */ 22525fbaff96SJunchao Zhang PetscCheck(rmap->N == cmap->N, comm, PETSC_ERR_SUP, "MATHYPRE COO cannot handle non-square matrices"); 22535fbaff96SJunchao Zhang 22545fbaff96SJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 22555fbaff96SJunchao Zhang if (!mat->boundtocpu) { /* mat will be on device, so will cooMat */ 22565fbaff96SJunchao Zhang #if defined(PETSC_HAVE_KOKKOS) 22575fbaff96SJunchao Zhang matType = MATAIJKOKKOS; 22585fbaff96SJunchao Zhang #else 22595fbaff96SJunchao Zhang SETERRQ(comm, PETSC_ERR_SUP, "To support MATHYPRE COO assembly on device, we need Kokkos, e.g., --download-kokkos --download-kokkos-kernels"); 22605fbaff96SJunchao Zhang #endif 22615fbaff96SJunchao Zhang } 22625fbaff96SJunchao Zhang #endif 22635fbaff96SJunchao Zhang 22645fbaff96SJunchao Zhang /* Do COO preallocation through cooMat */ 22655fbaff96SJunchao Zhang hmat = (Mat_HYPRE *)mat->data; 22665fbaff96SJunchao Zhang PetscCall(MatDestroy(&hmat->cooMat)); 22675fbaff96SJunchao Zhang PetscCall(MatCreate(comm, &cooMat)); 22685fbaff96SJunchao Zhang PetscCall(MatSetType(cooMat, matType)); 22695fbaff96SJunchao Zhang PetscCall(MatSetLayouts(cooMat, rmap, cmap)); 22705fbaff96SJunchao Zhang PetscCall(MatSetPreallocationCOO(cooMat, coo_n, coo_i, coo_j)); 22715fbaff96SJunchao Zhang 22725fbaff96SJunchao Zhang /* Copy the sparsity pattern from cooMat to hypre IJMatrix hmat->ij */ 22735fbaff96SJunchao Zhang PetscCall(MatSetOption(mat, MAT_SORTED_FULL, PETSC_TRUE)); 22745fbaff96SJunchao Zhang PetscCall(MatSetOption(mat, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 22755fbaff96SJunchao Zhang PetscCall(MatHYPRE_CreateFromMat(cooMat, hmat)); /* Create hmat->ij and preallocate it */ 22765fbaff96SJunchao Zhang PetscCall(MatHYPRE_IJMatrixCopy(cooMat, hmat->ij)); /* Copy A's (a,i,j) to hmat->ij. To reuse code. Copying 'a' is not really needed */ 22775fbaff96SJunchao Zhang 22785fbaff96SJunchao Zhang mat->preallocated = PETSC_TRUE; 22795fbaff96SJunchao Zhang PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 22805fbaff96SJunchao Zhang PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); /* Migrate mat to device if it is bound to. Hypre builds its own SpMV context here */ 22815fbaff96SJunchao Zhang 22822c4ab24aSJunchao Zhang /* Attach cooMat to mat */ 22832c4ab24aSJunchao Zhang PetscCall(MatAttachCOOMat_HYPRE(mat, cooMat)); 22843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22855fbaff96SJunchao Zhang } 22865fbaff96SJunchao Zhang 2287d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_HYPRE(Mat mat, const PetscScalar v[], InsertMode imode) 2288d71ae5a4SJacob Faibussowitsch { 22895fbaff96SJunchao Zhang Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data; 22905fbaff96SJunchao Zhang PetscMPIInt size; 22915fbaff96SJunchao Zhang Mat A; 22925fbaff96SJunchao Zhang 22935fbaff96SJunchao Zhang PetscFunctionBegin; 22945fbaff96SJunchao Zhang PetscCheck(hmat->cooMat, hmat->comm, PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet"); 22955fbaff96SJunchao Zhang PetscCallMPI(MPI_Comm_size(hmat->comm, &size)); 22965fbaff96SJunchao Zhang PetscCall(MatSetValuesCOO(hmat->cooMat, v, imode)); 22975fbaff96SJunchao Zhang 22985fbaff96SJunchao Zhang /* Move diagonal elements of the diagonal block to the front of their row, as needed by ParCSRMatrix. So damn hacky */ 22995fbaff96SJunchao Zhang A = (size == 1) ? hmat->cooMat : ((Mat_MPIAIJ *)hmat->cooMat->data)->A; 23005fbaff96SJunchao Zhang if (hmat->memType == HYPRE_MEMORY_HOST) { 23015fbaff96SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 23025fbaff96SJunchao Zhang PetscInt i, m, *Ai = aij->i, *Adiag = aij->diag; 23035fbaff96SJunchao Zhang PetscScalar *Aa = aij->a, tmp; 23045fbaff96SJunchao Zhang 23055fbaff96SJunchao Zhang PetscCall(MatGetSize(A, &m, NULL)); 23065fbaff96SJunchao Zhang for (i = 0; i < m; i++) { 23075fbaff96SJunchao Zhang if (Adiag[i] >= Ai[i] && Adiag[i] < Ai[i + 1]) { /* Digonal element of this row exists in a[] and j[] */ 23085fbaff96SJunchao Zhang tmp = Aa[Ai[i]]; 23095fbaff96SJunchao Zhang Aa[Ai[i]] = Aa[Adiag[i]]; 23105fbaff96SJunchao Zhang Aa[Adiag[i]] = tmp; 23115fbaff96SJunchao Zhang } 23125fbaff96SJunchao Zhang } 23135fbaff96SJunchao Zhang } else { 23145fbaff96SJunchao Zhang #if defined(PETSC_HAVE_KOKKOS_KERNELS) 23155fbaff96SJunchao Zhang PetscCall(MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos(A, hmat->diag)); 23165fbaff96SJunchao Zhang #endif 23175fbaff96SJunchao Zhang } 23183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23195fbaff96SJunchao Zhang } 23205fbaff96SJunchao Zhang 2321a055b5aaSBarry Smith /*MC 23222ef1f0ffSBarry Smith MATHYPRE - "hypre" - A matrix type to be used for sequential and parallel sparse matrices 2323a055b5aaSBarry Smith based on the hypre IJ interface. 2324a055b5aaSBarry Smith 2325a055b5aaSBarry Smith Level: intermediate 2326a055b5aaSBarry Smith 23272ef1f0ffSBarry Smith .seealso: [](chapter_matrices), `Mat`, `MatCreate()`, `MatHYPRESetPreallocation` 2328a055b5aaSBarry Smith M*/ 2329a055b5aaSBarry Smith 2330d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B) 2331d71ae5a4SJacob Faibussowitsch { 233263c07aadSStefano Zampini Mat_HYPRE *hB; 233363c07aadSStefano Zampini 233463c07aadSStefano Zampini PetscFunctionBegin; 23354dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&hB)); 23366ea7df73SStefano Zampini 2337978814f1SStefano Zampini hB->inner_free = PETSC_TRUE; 2338c69f721fSFande Kong hB->available = PETSC_TRUE; 2339336664bdSPierre Jolivet hB->sorted_full = PETSC_FALSE; /* no assumption whether column indices are sorted or not */ 2340c69f721fSFande Kong hB->size = 0; 2341c69f721fSFande Kong hB->array = NULL; 2342978814f1SStefano Zampini 234363c07aadSStefano Zampini B->data = (void *)hB; 234463c07aadSStefano Zampini B->assembled = PETSC_FALSE; 234563c07aadSStefano Zampini 23469566063dSJacob Faibussowitsch PetscCall(PetscMemzero(B->ops, sizeof(struct _MatOps))); 234763c07aadSStefano Zampini B->ops->mult = MatMult_HYPRE; 234863c07aadSStefano Zampini B->ops->multtranspose = MatMultTranspose_HYPRE; 2349414bd5c3SStefano Zampini B->ops->multadd = MatMultAdd_HYPRE; 2350414bd5c3SStefano Zampini B->ops->multtransposeadd = MatMultTransposeAdd_HYPRE; 235163c07aadSStefano Zampini B->ops->setup = MatSetUp_HYPRE; 235263c07aadSStefano Zampini B->ops->destroy = MatDestroy_HYPRE; 235363c07aadSStefano Zampini B->ops->assemblyend = MatAssemblyEnd_HYPRE; 2354c69f721fSFande Kong B->ops->assemblybegin = MatAssemblyBegin_HYPRE; 2355d975228cSstefano_zampini B->ops->setvalues = MatSetValues_HYPRE; 235668ec7858SStefano Zampini B->ops->missingdiagonal = MatMissingDiagonal_HYPRE; 235768ec7858SStefano Zampini B->ops->scale = MatScale_HYPRE; 235868ec7858SStefano Zampini B->ops->zerorowscolumns = MatZeroRowsColumns_HYPRE; 2359c69f721fSFande Kong B->ops->zeroentries = MatZeroEntries_HYPRE; 2360c69f721fSFande Kong B->ops->zerorows = MatZeroRows_HYPRE; 2361c69f721fSFande Kong B->ops->getrow = MatGetRow_HYPRE; 2362c69f721fSFande Kong B->ops->restorerow = MatRestoreRow_HYPRE; 2363c69f721fSFande Kong B->ops->getvalues = MatGetValues_HYPRE; 2364ddbeb582SStefano Zampini B->ops->setoption = MatSetOption_HYPRE; 236545b8d346SStefano Zampini B->ops->duplicate = MatDuplicate_HYPRE; 2366465edc17SStefano Zampini B->ops->copy = MatCopy_HYPRE; 236745b8d346SStefano Zampini B->ops->view = MatView_HYPRE; 23686305df00SStefano Zampini B->ops->getdiagonal = MatGetDiagonal_HYPRE; 2369363d496dSStefano Zampini B->ops->axpy = MatAXPY_HYPRE; 23704222ddf1SHong Zhang B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE; 23716ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 23726ea7df73SStefano Zampini B->ops->bindtocpu = MatBindToCPU_HYPRE; 23736ea7df73SStefano Zampini B->boundtocpu = PETSC_FALSE; 23746ea7df73SStefano Zampini #endif 237545b8d346SStefano Zampini 237645b8d346SStefano Zampini /* build cache for off array entries formed */ 23779566063dSJacob Faibussowitsch PetscCall(MatStashCreate_Private(PetscObjectComm((PetscObject)B), 1, &B->stash)); 237863c07aadSStefano Zampini 23799566063dSJacob Faibussowitsch PetscCall(PetscCommGetComm(PetscObjectComm((PetscObject)B), &hB->comm)); 23809566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATHYPRE)); 23819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_aij_C", MatConvert_HYPRE_AIJ)); 23829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_is_C", MatConvert_HYPRE_IS)); 23839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_hypre_C", MatProductSetFromOptions_HYPRE)); 23849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaij_hypre_C", MatProductSetFromOptions_HYPRE)); 23859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPRESetPreallocation_C", MatHYPRESetPreallocation_HYPRE)); 23869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPREGetParCSR_C", MatHYPREGetParCSR_HYPRE)); 23875fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_HYPRE)); 23885fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_HYPRE)); 23896ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 23906ea7df73SStefano Zampini #if defined(HYPRE_USING_HIP) 23919566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_HIP)); 23929566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B, VECHIP)); 23936ea7df73SStefano Zampini #endif 23946ea7df73SStefano Zampini #if defined(HYPRE_USING_CUDA) 23959566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_CUDA)); 23969566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B, VECCUDA)); 23976ea7df73SStefano Zampini #endif 23986ea7df73SStefano Zampini #endif 2399*ea9ee2c1SPierre Jolivet PetscHYPREInitialize(); 24003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 240163c07aadSStefano Zampini } 240263c07aadSStefano Zampini 2403d71ae5a4SJacob Faibussowitsch static PetscErrorCode hypre_array_destroy(void *ptr) 2404d71ae5a4SJacob Faibussowitsch { 2405225daaf8SStefano Zampini PetscFunctionBegin; 2406e6de0934SSatish Balay hypre_TFree(ptr, HYPRE_MEMORY_HOST); 24073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2408225daaf8SStefano Zampini } 2409