163c07aadSStefano Zampini 263c07aadSStefano Zampini /* 363c07aadSStefano Zampini Creates hypre ijmatrix from PETSc matrix 463c07aadSStefano Zampini */ 5225daaf8SStefano Zampini 6c6698e78SStefano Zampini #include <petscpkg_version.h> 739accc25SStefano Zampini #include <petsc/private/petschypre.h> 8dd9c0a25Sstefano_zampini #include <petscmathypre.h> 963c07aadSStefano Zampini #include <petsc/private/matimpl.h> 10a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h> 1163c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h> 1263c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h> 1358968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h> 1458968eb6SStefano Zampini #include <HYPRE.h> 15c1a070e6SStefano Zampini #include <HYPRE_utilities.h> 16cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h> 1768ec7858SStefano Zampini #include <_hypre_sstruct_ls.h> 1863c07aadSStefano Zampini 190e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0) 200e6427aaSSatish Balay #define hypre_ParCSRMatrixClone(A,B) hypre_ParCSRMatrixCompleteClone(A) 210e6427aaSSatish Balay #endif 220e6427aaSSatish Balay 2363c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat,Mat_HYPRE*); 2463c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat,Mat,HYPRE_IJMatrix); 2563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat,HYPRE_IJMatrix); 2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat,HYPRE_IJMatrix); 2739accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat,HYPRE_Complex,Vec,HYPRE_Complex,Vec,PetscBool); 28225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void*); 296ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat,PetscInt,const PetscInt[],PetscInt,const PetscInt[],const PetscScalar[],InsertMode ins); 3063c07aadSStefano Zampini 3163c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij) 3263c07aadSStefano Zampini { 3363c07aadSStefano Zampini PetscInt i,n_d,n_o; 3463c07aadSStefano Zampini const PetscInt *ia_d,*ia_o; 3563c07aadSStefano Zampini PetscBool done_d=PETSC_FALSE,done_o=PETSC_FALSE; 362cf14000SStefano Zampini HYPRE_Int *nnz_d=NULL,*nnz_o=NULL; 3763c07aadSStefano Zampini 3863c07aadSStefano Zampini PetscFunctionBegin; 3963c07aadSStefano Zampini if (A_d) { /* determine number of nonzero entries in local diagonal part */ 409566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_d,0,PETSC_FALSE,PETSC_FALSE,&n_d,&ia_d,NULL,&done_d)); 4163c07aadSStefano Zampini if (done_d) { 429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_d,&nnz_d)); 4363c07aadSStefano Zampini for (i=0; i<n_d; i++) { 4463c07aadSStefano Zampini nnz_d[i] = ia_d[i+1] - ia_d[i]; 4563c07aadSStefano Zampini } 4663c07aadSStefano Zampini } 479566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_d,0,PETSC_FALSE,PETSC_FALSE,NULL,&ia_d,NULL,&done_d)); 4863c07aadSStefano Zampini } 4963c07aadSStefano Zampini if (A_o) { /* determine number of nonzero entries in local off-diagonal part */ 509566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_o,0,PETSC_FALSE,PETSC_FALSE,&n_o,&ia_o,NULL,&done_o)); 5163c07aadSStefano Zampini if (done_o) { 529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_o,&nnz_o)); 5363c07aadSStefano Zampini for (i=0; i<n_o; i++) { 5463c07aadSStefano Zampini nnz_o[i] = ia_o[i+1] - ia_o[i]; 5563c07aadSStefano Zampini } 5663c07aadSStefano Zampini } 579566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_o,0,PETSC_FALSE,PETSC_FALSE,&n_o,&ia_o,NULL,&done_o)); 5863c07aadSStefano Zampini } 5963c07aadSStefano Zampini if (done_d) { /* set number of nonzeros in HYPRE IJ matrix */ 6063c07aadSStefano Zampini if (!done_o) { /* only diagonal part */ 619566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n_d,&nnz_o)); 6263c07aadSStefano Zampini } 63c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0) 64c6698e78SStefano Zampini { /* If we don't do this, the columns of the matrix will be all zeros! */ 65c6698e78SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 66c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij); 67c6698e78SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 68c6698e78SStefano Zampini hypre_IJMatrixTranslator(ij) = NULL; 69792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes,ij,nnz_d,nnz_o); 7022235d61SPierre Jolivet /* it seems they partially fixed it in 2.19.0 */ 7122235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 72c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij); 73c6698e78SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; 7422235d61SPierre Jolivet #endif 75c6698e78SStefano Zampini } 76c6698e78SStefano Zampini #else 77792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes,ij,nnz_d,nnz_o); 78c6698e78SStefano Zampini #endif 799566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_d)); 809566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_o)); 8163c07aadSStefano Zampini } 8263c07aadSStefano Zampini PetscFunctionReturn(0); 8363c07aadSStefano Zampini } 8463c07aadSStefano Zampini 8563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA) 8663c07aadSStefano Zampini { 8763c07aadSStefano Zampini PetscInt rstart,rend,cstart,cend; 8863c07aadSStefano Zampini 8963c07aadSStefano Zampini PetscFunctionBegin; 909566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 919566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 9263c07aadSStefano Zampini rstart = A->rmap->rstart; 9363c07aadSStefano Zampini rend = A->rmap->rend; 9463c07aadSStefano Zampini cstart = A->cmap->rstart; 9563c07aadSStefano Zampini cend = A->cmap->rend; 96792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate,hA->comm,rstart,rend-1,cstart,cend-1,&hA->ij); 97792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR); 9863c07aadSStefano Zampini { 9963c07aadSStefano Zampini PetscBool same; 10063c07aadSStefano Zampini Mat A_d,A_o; 10163c07aadSStefano Zampini const PetscInt *colmap; 1029566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&same)); 10363c07aadSStefano Zampini if (same) { 1049566063dSJacob Faibussowitsch PetscCall(MatMPIAIJGetSeqAIJ(A,&A_d,&A_o,&colmap)); 1059566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d,A_o,hA->ij)); 10663c07aadSStefano Zampini PetscFunctionReturn(0); 10763c07aadSStefano Zampini } 1089566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIBAIJ,&same)); 10963c07aadSStefano Zampini if (same) { 1109566063dSJacob Faibussowitsch PetscCall(MatMPIBAIJGetSeqBAIJ(A,&A_d,&A_o,&colmap)); 1119566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d,A_o,hA->ij)); 11263c07aadSStefano Zampini PetscFunctionReturn(0); 11363c07aadSStefano Zampini } 1149566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&same)); 11563c07aadSStefano Zampini if (same) { 1169566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A,NULL,hA->ij)); 11763c07aadSStefano Zampini PetscFunctionReturn(0); 11863c07aadSStefano Zampini } 1199566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQBAIJ,&same)); 12063c07aadSStefano Zampini if (same) { 1219566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A,NULL,hA->ij)); 12263c07aadSStefano Zampini PetscFunctionReturn(0); 12363c07aadSStefano Zampini } 12463c07aadSStefano Zampini } 12563c07aadSStefano Zampini PetscFunctionReturn(0); 12663c07aadSStefano Zampini } 12763c07aadSStefano Zampini 12863c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopy(Mat A, HYPRE_IJMatrix ij) 12963c07aadSStefano Zampini { 13063c07aadSStefano Zampini PetscInt i,rstart,rend,ncols,nr,nc; 13163c07aadSStefano Zampini const PetscScalar *values; 13263c07aadSStefano Zampini const PetscInt *cols; 13363c07aadSStefano Zampini PetscBool flg; 13463c07aadSStefano Zampini 13563c07aadSStefano Zampini PetscFunctionBegin; 1366ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 137792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize,ij); 1386ea7df73SStefano Zampini #else 139792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize_v2,ij,HYPRE_MEMORY_HOST); 1406ea7df73SStefano Zampini #endif 1419566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&flg)); 1429566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&nr,&nc)); 14363c07aadSStefano Zampini if (flg && nr == nc) { 1449566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixFastCopy_MPIAIJ(A,ij)); 14563c07aadSStefano Zampini PetscFunctionReturn(0); 14663c07aadSStefano Zampini } 1479566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&flg)); 14863c07aadSStefano Zampini if (flg) { 1499566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixFastCopy_SeqAIJ(A,ij)); 15063c07aadSStefano Zampini PetscFunctionReturn(0); 15163c07aadSStefano Zampini } 15263c07aadSStefano Zampini 1535fbaff96SJunchao Zhang /* Do not need Aux since we have done precise i[],j[] allocation in MatHYPRE_CreateFromMat() */ 1545fbaff96SJunchao Zhang hypre_AuxParCSRMatrixNeedAux((hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij)) = 0; 1555fbaff96SJunchao Zhang 1569566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A,&rstart,&rend)); 15763c07aadSStefano Zampini for (i=rstart; i<rend; i++) { 1589566063dSJacob Faibussowitsch PetscCall(MatGetRow(A,i,&ncols,&cols,&values)); 159e3977e59Sstefano_zampini if (ncols) { 1602cf14000SStefano Zampini HYPRE_Int nc = (HYPRE_Int)ncols; 1612cf14000SStefano Zampini 162aed4548fSBarry Smith PetscCheck((PetscInt)nc == ncols,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,ncols,i); 163792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetValues,ij,1,&nc,(HYPRE_BigInt *)&i,(HYPRE_BigInt *)cols,(HYPRE_Complex *)values); 164e3977e59Sstefano_zampini } 1659566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(A,i,&ncols,&cols,&values)); 16663c07aadSStefano Zampini } 16763c07aadSStefano Zampini PetscFunctionReturn(0); 16863c07aadSStefano Zampini } 16963c07aadSStefano Zampini 17063c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat A, HYPRE_IJMatrix ij) 17163c07aadSStefano Zampini { 17263c07aadSStefano Zampini Mat_SeqAIJ *pdiag = (Mat_SeqAIJ*)A->data; 17358968eb6SStefano Zampini HYPRE_Int type; 17463c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 17563c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 17663c07aadSStefano Zampini hypre_CSRMatrix *hdiag; 1772cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 1786ea7df73SStefano Zampini const PetscScalar *pa; 17963c07aadSStefano Zampini 18063c07aadSStefano Zampini PetscFunctionBegin; 181792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,ij,&type); 18208401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 183792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,ij,(void**)&par_matrix); 18463c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 18563c07aadSStefano Zampini /* 18663c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 18763c07aadSStefano Zampini */ 1882cf14000SStefano Zampini if (sameint) { 1899566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i,pdiag->i,A->rmap->n + 1)); 1909566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->j,pdiag->j,pdiag->nz)); 1912cf14000SStefano Zampini } else { 1922cf14000SStefano Zampini PetscInt i; 1932cf14000SStefano Zampini 1942cf14000SStefano Zampini for (i=0;i<A->rmap->n + 1;i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i]; 1952cf14000SStefano Zampini for (i=0;i<pdiag->nz;i++) hdiag->j[i] = (HYPRE_Int)pdiag->j[i]; 1962cf14000SStefano Zampini } 1976ea7df73SStefano Zampini 1989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&pa)); 1999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->data,pa,pdiag->nz)); 2009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&pa)); 201ea9daf28SStefano Zampini 202ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij); 20363c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 20463c07aadSStefano Zampini PetscFunctionReturn(0); 20563c07aadSStefano Zampini } 20663c07aadSStefano Zampini 20763c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat A, HYPRE_IJMatrix ij) 20863c07aadSStefano Zampini { 20963c07aadSStefano Zampini Mat_MPIAIJ *pA = (Mat_MPIAIJ*)A->data; 21063c07aadSStefano Zampini Mat_SeqAIJ *pdiag,*poffd; 21163c07aadSStefano Zampini PetscInt i,*garray = pA->garray,*jj,cstart,*pjj; 2122cf14000SStefano Zampini HYPRE_Int *hjj,type; 21363c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 21463c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 21563c07aadSStefano Zampini hypre_CSRMatrix *hdiag,*hoffd; 2162cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 2176ea7df73SStefano Zampini const PetscScalar *pa; 21863c07aadSStefano Zampini 21963c07aadSStefano Zampini PetscFunctionBegin; 22063c07aadSStefano Zampini pdiag = (Mat_SeqAIJ*) pA->A->data; 22163c07aadSStefano Zampini poffd = (Mat_SeqAIJ*) pA->B->data; 22263c07aadSStefano Zampini /* cstart is only valid for square MPIAIJ layed out in the usual way */ 2239566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A,&cstart,NULL)); 22463c07aadSStefano Zampini 225792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,ij,&type); 22608401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 227792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,ij,(void**)&par_matrix); 22863c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 22963c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(par_matrix); 23063c07aadSStefano Zampini 23163c07aadSStefano Zampini /* 23263c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 23363c07aadSStefano Zampini */ 2342cf14000SStefano Zampini if (sameint) { 2359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i,pdiag->i,pA->A->rmap->n + 1)); 2362cf14000SStefano Zampini } else { 2372cf14000SStefano Zampini for (i=0; i<pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)(pdiag->i[i]); 2382cf14000SStefano Zampini } 23963c07aadSStefano Zampini /* need to shift the diag column indices (hdiag->j) back to global numbering since hypre is expecting this */ 2402cf14000SStefano Zampini hjj = hdiag->j; 2412cf14000SStefano Zampini pjj = pdiag->j; 242c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0) 2432cf14000SStefano Zampini for (i=0; i<pdiag->nz; i++) hjj[i] = pjj[i]; 244c6698e78SStefano Zampini #else 2452cf14000SStefano Zampini for (i=0; i<pdiag->nz; i++) hjj[i] = cstart + pjj[i]; 246c6698e78SStefano Zampini #endif 2479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(pA->A,&pa)); 2489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->data,pa,pdiag->nz)); 2499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(pA->A,&pa)); 2502cf14000SStefano Zampini if (sameint) { 2519566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hoffd->i,poffd->i,pA->A->rmap->n + 1)); 2522cf14000SStefano Zampini } else { 2532cf14000SStefano Zampini for (i=0; i<pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)(poffd->i[i]); 2542cf14000SStefano Zampini } 2552cf14000SStefano Zampini 25663c07aadSStefano Zampini /* need to move the offd column indices (hoffd->j) back to global numbering since hypre is expecting this 25763c07aadSStefano Zampini If we hacked a hypre a bit more we might be able to avoid this step */ 258c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0) 259792fecdfSBarry Smith PetscCallExternal(hypre_CSRMatrixBigInitialize,hoffd); 260c6698e78SStefano Zampini jj = (PetscInt*) hoffd->big_j; 261c6698e78SStefano Zampini #else 26263c07aadSStefano Zampini jj = (PetscInt*) hoffd->j; 263c6698e78SStefano Zampini #endif 2642cf14000SStefano Zampini pjj = poffd->j; 26563c07aadSStefano Zampini for (i=0; i<poffd->nz; i++) jj[i] = garray[pjj[i]]; 266c6698e78SStefano Zampini 2679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(pA->B,&pa)); 2689566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hoffd->data,pa,poffd->nz)); 2699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(pA->B,&pa)); 27063c07aadSStefano Zampini 271ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij); 27263c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 27363c07aadSStefano Zampini PetscFunctionReturn(0); 27463c07aadSStefano Zampini } 27563c07aadSStefano Zampini 2762df22349SStefano Zampini static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat* B) 2772df22349SStefano Zampini { 2782df22349SStefano Zampini Mat_HYPRE* mhA = (Mat_HYPRE*)(A->data); 2792df22349SStefano Zampini Mat lA; 2802df22349SStefano Zampini ISLocalToGlobalMapping rl2g,cl2g; 2812df22349SStefano Zampini IS is; 2822df22349SStefano Zampini hypre_ParCSRMatrix *hA; 2832df22349SStefano Zampini hypre_CSRMatrix *hdiag,*hoffd; 2842df22349SStefano Zampini MPI_Comm comm; 28539accc25SStefano Zampini HYPRE_Complex *hdd,*hod,*aa; 28639accc25SStefano Zampini PetscScalar *data; 2872cf14000SStefano Zampini HYPRE_BigInt *col_map_offd; 2882cf14000SStefano Zampini HYPRE_Int *hdi,*hdj,*hoi,*hoj; 2892df22349SStefano Zampini PetscInt *ii,*jj,*iptr,*jptr; 2902df22349SStefano Zampini PetscInt cum,dr,dc,oc,str,stc,nnz,i,jd,jo,M,N; 29158968eb6SStefano Zampini HYPRE_Int type; 2922df22349SStefano Zampini 2932df22349SStefano Zampini PetscFunctionBegin; 294a1787963SStefano Zampini comm = PetscObjectComm((PetscObject)A); 295792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,mhA->ij,&type); 29608401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 297792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,mhA->ij,(void**)&hA); 2982df22349SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(hA); 2992df22349SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(hA); 3002df22349SStefano Zampini str = hypre_ParCSRMatrixFirstRowIndex(hA); 3012df22349SStefano Zampini stc = hypre_ParCSRMatrixFirstColDiag(hA); 3022df22349SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(hA); 3032df22349SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(hA); 3042df22349SStefano Zampini dr = hypre_CSRMatrixNumRows(hdiag); 3052df22349SStefano Zampini dc = hypre_CSRMatrixNumCols(hdiag); 3062df22349SStefano Zampini nnz = hypre_CSRMatrixNumNonzeros(hdiag); 3072df22349SStefano Zampini hdi = hypre_CSRMatrixI(hdiag); 3082df22349SStefano Zampini hdj = hypre_CSRMatrixJ(hdiag); 3092df22349SStefano Zampini hdd = hypre_CSRMatrixData(hdiag); 3102df22349SStefano Zampini oc = hypre_CSRMatrixNumCols(hoffd); 3112df22349SStefano Zampini nnz += hypre_CSRMatrixNumNonzeros(hoffd); 3122df22349SStefano Zampini hoi = hypre_CSRMatrixI(hoffd); 3132df22349SStefano Zampini hoj = hypre_CSRMatrixJ(hoffd); 3142df22349SStefano Zampini hod = hypre_CSRMatrixData(hoffd); 3152df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 3162df22349SStefano Zampini PetscInt *aux; 3172df22349SStefano Zampini 3182df22349SStefano Zampini /* generate l2g maps for rows and cols */ 3199566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm,dr,str,1,&is)); 3209566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is,&rl2g)); 3219566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 3222df22349SStefano Zampini col_map_offd = hypre_ParCSRMatrixColMapOffd(hA); 3239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dc+oc,&aux)); 3242df22349SStefano Zampini for (i=0; i<dc; i++) aux[i] = i+stc; 3252df22349SStefano Zampini for (i=0; i<oc; i++) aux[i+dc] = col_map_offd[i]; 3269566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(comm,dc+oc,aux,PETSC_OWN_POINTER,&is)); 3279566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is,&cl2g)); 3289566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 3292df22349SStefano Zampini /* create MATIS object */ 3309566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,B)); 3319566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,dr,dc,M,N)); 3329566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,MATIS)); 3339566063dSJacob Faibussowitsch PetscCall(MatSetLocalToGlobalMapping(*B,rl2g,cl2g)); 3349566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&rl2g)); 3359566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&cl2g)); 3362df22349SStefano Zampini 3372df22349SStefano Zampini /* allocate CSR for local matrix */ 3389566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dr+1,&iptr)); 3399566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz,&jptr)); 3409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz,&data)); 3412df22349SStefano Zampini } else { 3422df22349SStefano Zampini PetscInt nr; 3432df22349SStefano Zampini PetscBool done; 3449566063dSJacob Faibussowitsch PetscCall(MatISGetLocalMat(*B,&lA)); 3459566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(lA,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&iptr,(const PetscInt**)&jptr,&done)); 34608401ef6SPierre Jolivet PetscCheck(nr == dr,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT,nr,dr); 34708401ef6SPierre Jolivet PetscCheck(iptr[nr] >= nnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in local mat! reuse %" PetscInt_FMT " requested %" PetscInt_FMT,iptr[nr],nnz); 3489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(lA,&data)); 3492df22349SStefano Zampini } 3502df22349SStefano Zampini /* merge local matrices */ 3512df22349SStefano Zampini ii = iptr; 3522df22349SStefano Zampini jj = jptr; 35339accc25SStefano Zampini aa = (HYPRE_Complex*)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 3542df22349SStefano Zampini *ii = *(hdi++) + *(hoi++); 3552df22349SStefano Zampini for (jd=0,jo=0,cum=0; *ii<nnz; cum++) { 35639accc25SStefano Zampini PetscScalar *aold = (PetscScalar*)aa; 3572df22349SStefano Zampini PetscInt *jold = jj,nc = jd+jo; 3582df22349SStefano Zampini for (; jd<*hdi; jd++) { *jj++ = *hdj++; *aa++ = *hdd++; } 3592df22349SStefano Zampini for (; jo<*hoi; jo++) { *jj++ = *hoj++ + dc; *aa++ = *hod++; } 3602df22349SStefano Zampini *(++ii) = *(hdi++) + *(hoi++); 3619566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(jd+jo-nc,jold,aold)); 3622df22349SStefano Zampini } 3632df22349SStefano Zampini for (; cum<dr; cum++) *(++ii) = nnz; 3642df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 365a033916dSStefano Zampini Mat_SeqAIJ* a; 366a033916dSStefano Zampini 3679566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,dr,dc+oc,iptr,jptr,data,&lA)); 3689566063dSJacob Faibussowitsch PetscCall(MatISSetLocalMat(*B,lA)); 369a033916dSStefano Zampini /* hack SeqAIJ */ 370a033916dSStefano Zampini a = (Mat_SeqAIJ*)(lA->data); 371a033916dSStefano Zampini a->free_a = PETSC_TRUE; 372a033916dSStefano Zampini a->free_ij = PETSC_TRUE; 3739566063dSJacob Faibussowitsch PetscCall(MatDestroy(&lA)); 3742df22349SStefano Zampini } 3759566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY)); 3769566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY)); 3772df22349SStefano Zampini if (reuse == MAT_INPLACE_MATRIX) { 3789566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A,B)); 3792df22349SStefano Zampini } 3802df22349SStefano Zampini PetscFunctionReturn(0); 3812df22349SStefano Zampini } 3822df22349SStefano Zampini 38363c07aadSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B) 38463c07aadSStefano Zampini { 38584d4e069SStefano Zampini Mat M = NULL; 38663c07aadSStefano Zampini Mat_HYPRE *hB; 38763c07aadSStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 38863c07aadSStefano Zampini 38963c07aadSStefano Zampini PetscFunctionBegin; 39063c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 39163c07aadSStefano Zampini /* always destroy the old matrix and create a new memory; 39263c07aadSStefano Zampini hope this does not churn the memory too much. The problem 39363c07aadSStefano Zampini is I do not know if it is possible to put the matrix back to 39463c07aadSStefano Zampini its initial state so that we can directly copy the values 39563c07aadSStefano Zampini the second time through. */ 39663c07aadSStefano Zampini hB = (Mat_HYPRE*)((*B)->data); 397792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixDestroy,hB->ij); 39863c07aadSStefano Zampini } else { 3999566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,&M)); 4009566063dSJacob Faibussowitsch PetscCall(MatSetType(M,MATHYPRE)); 4019566063dSJacob Faibussowitsch PetscCall(MatSetSizes(M,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N)); 40284d4e069SStefano Zampini hB = (Mat_HYPRE*)(M->data); 40384d4e069SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) *B = M; 40463c07aadSStefano Zampini } 4059566063dSJacob Faibussowitsch PetscCall(MatSetOption(*B,MAT_SORTED_FULL,PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 4069566063dSJacob Faibussowitsch PetscCall(MatSetOption(*B,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE)); 4079566063dSJacob Faibussowitsch PetscCall(MatHYPRE_CreateFromMat(A,hB)); 4089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixCopy(A,hB->ij)); 40984d4e069SStefano Zampini if (reuse == MAT_INPLACE_MATRIX) { 4109566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A,&M)); 41184d4e069SStefano Zampini } 4124ec6421dSstefano_zampini (*B)->preallocated = PETSC_TRUE; 4139566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY)); 4149566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY)); 41563c07aadSStefano Zampini PetscFunctionReturn(0); 41663c07aadSStefano Zampini } 41763c07aadSStefano Zampini 418ea9daf28SStefano Zampini static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B) 41963c07aadSStefano Zampini { 42063c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 42163c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 42263c07aadSStefano Zampini hypre_CSRMatrix *hdiag,*hoffd; 42363c07aadSStefano Zampini MPI_Comm comm; 42463c07aadSStefano Zampini PetscScalar *da,*oa,*aptr; 42563c07aadSStefano Zampini PetscInt *dii,*djj,*oii,*ojj,*iptr; 42663c07aadSStefano Zampini PetscInt i,dnnz,onnz,m,n; 42758968eb6SStefano Zampini HYPRE_Int type; 42863c07aadSStefano Zampini PetscMPIInt size; 4292cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 43063c07aadSStefano Zampini 43163c07aadSStefano Zampini PetscFunctionBegin; 43263c07aadSStefano Zampini comm = PetscObjectComm((PetscObject)A); 433792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,hA->ij,&type); 43408401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 43563c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 43663c07aadSStefano Zampini PetscBool ismpiaij,isseqaij; 4379566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B,MATMPIAIJ,&ismpiaij)); 4389566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B,MATSEQAIJ,&isseqaij)); 43908401ef6SPierre Jolivet PetscCheck(ismpiaij || isseqaij,comm,PETSC_ERR_SUP,"Only MATMPIAIJ or MATSEQAIJ are supported"); 44063c07aadSStefano Zampini } 4416ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 44208401ef6SPierre Jolivet PetscCheck(HYPRE_MEMORY_DEVICE != hypre_IJMatrixMemoryLocation(hA->ij),comm,PETSC_ERR_SUP,"Not yet implemented"); 4436ea7df73SStefano Zampini #endif 4449566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm,&size)); 44563c07aadSStefano Zampini 446792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 44763c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 44863c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 44963c07aadSStefano Zampini m = hypre_CSRMatrixNumRows(hdiag); 45063c07aadSStefano Zampini n = hypre_CSRMatrixNumCols(hdiag); 45163c07aadSStefano Zampini dnnz = hypre_CSRMatrixNumNonzeros(hdiag); 45263c07aadSStefano Zampini onnz = hypre_CSRMatrixNumNonzeros(hoffd); 453225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 4549566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&dii)); 4559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz,&djj)); 4569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz,&da)); 457225daaf8SStefano Zampini } else if (reuse == MAT_REUSE_MATRIX) { 45863c07aadSStefano Zampini PetscInt nr; 45963c07aadSStefano Zampini PetscBool done; 46063c07aadSStefano Zampini if (size > 1) { 46163c07aadSStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data); 46263c07aadSStefano Zampini 4639566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(b->A,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&dii,(const PetscInt**)&djj,&done)); 46408401ef6SPierre Jolivet PetscCheck(nr == m,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows in diag part! %" PetscInt_FMT " != %" PetscInt_FMT,nr,m); 46508401ef6SPierre Jolivet PetscCheck(dii[nr] >= dnnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in diag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,dii[nr],dnnz); 4669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(b->A,&da)); 46763c07aadSStefano Zampini } else { 4689566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(*B,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&dii,(const PetscInt**)&djj,&done)); 46908401ef6SPierre Jolivet PetscCheck(nr == m,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows! %" PetscInt_FMT " != %" PetscInt_FMT,nr,m); 47008401ef6SPierre Jolivet PetscCheck(dii[nr] >= dnnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,dii[nr],dnnz); 4719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*B,&da)); 47263c07aadSStefano Zampini } 473225daaf8SStefano Zampini } else { /* MAT_INPLACE_MATRIX */ 4742cf14000SStefano Zampini if (!sameint) { 4759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&dii)); 4769566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dnnz,&djj)); 4772cf14000SStefano Zampini } else { 4787d968826Sstefano_zampini dii = (PetscInt*)hypre_CSRMatrixI(hdiag); 4797d968826Sstefano_zampini djj = (PetscInt*)hypre_CSRMatrixJ(hdiag); 48063c07aadSStefano Zampini } 48139accc25SStefano Zampini da = (PetscScalar*)hypre_CSRMatrixData(hdiag); 48263c07aadSStefano Zampini } 4832cf14000SStefano Zampini 4842cf14000SStefano Zampini if (!sameint) { 485a16187a7SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { for (i=0;i<m+1;i++) dii[i] = (PetscInt)(hypre_CSRMatrixI(hdiag)[i]); } 4862cf14000SStefano Zampini for (i=0;i<dnnz;i++) djj[i] = (PetscInt)(hypre_CSRMatrixJ(hdiag)[i]); 4872cf14000SStefano Zampini } else { 4889566063dSJacob Faibussowitsch if (reuse != MAT_REUSE_MATRIX) PetscCall(PetscArraycpy(dii,hypre_CSRMatrixI(hdiag),m+1)); 4899566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(djj,hypre_CSRMatrixJ(hdiag),dnnz)); 4902cf14000SStefano Zampini } 4919566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(da,hypre_CSRMatrixData(hdiag),dnnz)); 49263c07aadSStefano Zampini iptr = djj; 49363c07aadSStefano Zampini aptr = da; 49463c07aadSStefano Zampini for (i=0; i<m; i++) { 49563c07aadSStefano Zampini PetscInt nc = dii[i+1]-dii[i]; 4969566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(nc,iptr,aptr)); 49763c07aadSStefano Zampini iptr += nc; 49863c07aadSStefano Zampini aptr += nc; 49963c07aadSStefano Zampini } 50063c07aadSStefano Zampini if (size > 1) { 5012cf14000SStefano Zampini HYPRE_BigInt *coffd; 5022cf14000SStefano Zampini HYPRE_Int *offdj; 50363c07aadSStefano Zampini 504225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 5059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&oii)); 5069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz,&ojj)); 5079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz,&oa)); 508225daaf8SStefano Zampini } else if (reuse == MAT_REUSE_MATRIX) { 50963c07aadSStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data); 51063c07aadSStefano Zampini PetscInt nr,hr = hypre_CSRMatrixNumRows(hoffd); 51163c07aadSStefano Zampini PetscBool done; 51263c07aadSStefano Zampini 5139566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(b->B,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&oii,(const PetscInt**)&ojj,&done)); 51408401ef6SPierre Jolivet PetscCheck(nr == hr,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows in offdiag part! %" PetscInt_FMT " != %" PetscInt_FMT,nr,hr); 51508401ef6SPierre Jolivet PetscCheck(oii[nr] >= onnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in offdiag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,oii[nr],onnz); 5169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(b->B,&oa)); 517225daaf8SStefano Zampini } else { /* MAT_INPLACE_MATRIX */ 5182cf14000SStefano Zampini if (!sameint) { 5199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&oii)); 5209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(onnz,&ojj)); 5212cf14000SStefano Zampini } else { 5227d968826Sstefano_zampini oii = (PetscInt*)hypre_CSRMatrixI(hoffd); 5237d968826Sstefano_zampini ojj = (PetscInt*)hypre_CSRMatrixJ(hoffd); 52463c07aadSStefano Zampini } 52539accc25SStefano Zampini oa = (PetscScalar*)hypre_CSRMatrixData(hoffd); 52663c07aadSStefano Zampini } 527a16187a7SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 5282cf14000SStefano Zampini if (!sameint) { 5292cf14000SStefano Zampini for (i=0;i<m+1;i++) oii[i] = (PetscInt)(hypre_CSRMatrixI(hoffd)[i]); 5302cf14000SStefano Zampini } else { 5319566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(oii,hypre_CSRMatrixI(hoffd),m+1)); 5322cf14000SStefano Zampini } 533a16187a7SStefano Zampini } 5349566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(oa,hypre_CSRMatrixData(hoffd),onnz)); 535a16187a7SStefano Zampini 53663c07aadSStefano Zampini offdj = hypre_CSRMatrixJ(hoffd); 53763c07aadSStefano Zampini coffd = hypre_ParCSRMatrixColMapOffd(parcsr); 538a16187a7SStefano Zampini /* we only need the permutation to be computed properly, I don't know if HYPRE 539a16187a7SStefano Zampini messes up with the ordering. Just in case, allocate some memory and free it 540a16187a7SStefano Zampini later */ 541a16187a7SStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 542a16187a7SStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data); 543a16187a7SStefano Zampini PetscInt mnz; 544a16187a7SStefano Zampini 5459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetMaxRowNonzeros(b->B,&mnz)); 5469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mnz,&ojj)); 547a16187a7SStefano Zampini } else for (i=0; i<onnz; i++) ojj[i] = coffd[offdj[i]]; 54863c07aadSStefano Zampini iptr = ojj; 54963c07aadSStefano Zampini aptr = oa; 55063c07aadSStefano Zampini for (i=0; i<m; i++) { 55163c07aadSStefano Zampini PetscInt nc = oii[i+1]-oii[i]; 552a16187a7SStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 553a16187a7SStefano Zampini PetscInt j; 554a16187a7SStefano Zampini 555a16187a7SStefano Zampini iptr = ojj; 556a16187a7SStefano Zampini for (j=0; j<nc; j++) iptr[j] = coffd[offdj[oii[i] + j]]; 557a16187a7SStefano Zampini } 5589566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(nc,iptr,aptr)); 55963c07aadSStefano Zampini iptr += nc; 56063c07aadSStefano Zampini aptr += nc; 56163c07aadSStefano Zampini } 5629566063dSJacob Faibussowitsch if (reuse == MAT_REUSE_MATRIX) PetscCall(PetscFree(ojj)); 563225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 56463c07aadSStefano Zampini Mat_MPIAIJ *b; 56563c07aadSStefano Zampini Mat_SeqAIJ *d,*o; 566225daaf8SStefano Zampini 5679566063dSJacob Faibussowitsch PetscCall(MatCreateMPIAIJWithSplitArrays(comm,m,n,PETSC_DECIDE,PETSC_DECIDE,dii,djj,da,oii,ojj,oa,B)); 56863c07aadSStefano Zampini /* hack MPIAIJ */ 56963c07aadSStefano Zampini b = (Mat_MPIAIJ*)((*B)->data); 57063c07aadSStefano Zampini d = (Mat_SeqAIJ*)b->A->data; 57163c07aadSStefano Zampini o = (Mat_SeqAIJ*)b->B->data; 57263c07aadSStefano Zampini d->free_a = PETSC_TRUE; 57363c07aadSStefano Zampini d->free_ij = PETSC_TRUE; 57463c07aadSStefano Zampini o->free_a = PETSC_TRUE; 57563c07aadSStefano Zampini o->free_ij = PETSC_TRUE; 576225daaf8SStefano Zampini } else if (reuse == MAT_INPLACE_MATRIX) { 577225daaf8SStefano Zampini Mat T; 5782cf14000SStefano Zampini 5799566063dSJacob Faibussowitsch PetscCall(MatCreateMPIAIJWithSplitArrays(comm,m,n,PETSC_DECIDE,PETSC_DECIDE,dii,djj,da,oii,ojj,oa,&T)); 5802cf14000SStefano Zampini if (sameint) { /* ownership of CSR pointers is transferred to PETSc */ 581225daaf8SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 582225daaf8SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 583225daaf8SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 584225daaf8SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 5852cf14000SStefano Zampini } else { /* Hack MPIAIJ -> free ij but not a */ 5862cf14000SStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ*)(T->data); 5872cf14000SStefano Zampini Mat_SeqAIJ *d = (Mat_SeqAIJ*)(b->A->data); 5882cf14000SStefano Zampini Mat_SeqAIJ *o = (Mat_SeqAIJ*)(b->B->data); 5892cf14000SStefano Zampini 5902cf14000SStefano Zampini d->free_ij = PETSC_TRUE; 5912cf14000SStefano Zampini o->free_ij = PETSC_TRUE; 5922cf14000SStefano Zampini } 5932cf14000SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 594225daaf8SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 5959566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A,&T)); 59663c07aadSStefano Zampini } 597225daaf8SStefano Zampini } else { 598225daaf8SStefano Zampini oii = NULL; 599225daaf8SStefano Zampini ojj = NULL; 600225daaf8SStefano Zampini oa = NULL; 601225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 60263c07aadSStefano Zampini Mat_SeqAIJ* b; 6032cf14000SStefano Zampini 6049566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(comm,m,n,dii,djj,da,B)); 60563c07aadSStefano Zampini /* hack SeqAIJ */ 60663c07aadSStefano Zampini b = (Mat_SeqAIJ*)((*B)->data); 60763c07aadSStefano Zampini b->free_a = PETSC_TRUE; 60863c07aadSStefano Zampini b->free_ij = PETSC_TRUE; 609225daaf8SStefano Zampini } else if (reuse == MAT_INPLACE_MATRIX) { 610225daaf8SStefano Zampini Mat T; 6112cf14000SStefano Zampini 6129566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(comm,m,n,dii,djj,da,&T)); 6132cf14000SStefano Zampini if (sameint) { /* ownership of CSR pointers is transferred to PETSc */ 614225daaf8SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 615225daaf8SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 6162cf14000SStefano Zampini } else { /* free ij but not a */ 6172cf14000SStefano Zampini Mat_SeqAIJ* b = (Mat_SeqAIJ*)(T->data); 6182cf14000SStefano Zampini 6192cf14000SStefano Zampini b->free_ij = PETSC_TRUE; 6202cf14000SStefano Zampini } 621225daaf8SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 6229566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A,&T)); 62363c07aadSStefano Zampini } 624225daaf8SStefano Zampini } 625225daaf8SStefano Zampini 6262cf14000SStefano Zampini /* we have to use hypre_Tfree to free the HYPRE arrays 6272cf14000SStefano Zampini that PETSc now onws */ 62863c07aadSStefano Zampini if (reuse == MAT_INPLACE_MATRIX) { 6292cf14000SStefano Zampini PetscInt nh; 6302cf14000SStefano Zampini void *ptrs[6] = {da,oa,dii,djj,oii,ojj}; 6312cf14000SStefano Zampini const char *names[6] = {"_hypre_csr_da", 6322cf14000SStefano Zampini "_hypre_csr_oa", 6332cf14000SStefano Zampini "_hypre_csr_dii", 634225daaf8SStefano Zampini "_hypre_csr_djj", 635225daaf8SStefano Zampini "_hypre_csr_oii", 6362cf14000SStefano Zampini "_hypre_csr_ojj"}; 6372cf14000SStefano Zampini nh = sameint ? 6 : 2; 6382cf14000SStefano Zampini for (i=0; i<nh; i++) { 639225daaf8SStefano Zampini PetscContainer c; 640225daaf8SStefano Zampini 6419566063dSJacob Faibussowitsch PetscCall(PetscContainerCreate(comm,&c)); 6429566063dSJacob Faibussowitsch PetscCall(PetscContainerSetPointer(c,ptrs[i])); 6439566063dSJacob Faibussowitsch PetscCall(PetscContainerSetUserDestroy(c,hypre_array_destroy)); 6449566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)(*B),names[i],(PetscObject)c)); 6459566063dSJacob Faibussowitsch PetscCall(PetscContainerDestroy(&c)); 646225daaf8SStefano Zampini } 64763c07aadSStefano Zampini } 64863c07aadSStefano Zampini PetscFunctionReturn(0); 64963c07aadSStefano Zampini } 65063c07aadSStefano Zampini 651613e5ff0Sstefano_zampini static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 652c1a070e6SStefano Zampini { 653613e5ff0Sstefano_zampini hypre_ParCSRMatrix *tA; 654c1a070e6SStefano Zampini hypre_CSRMatrix *hdiag,*hoffd; 655c1a070e6SStefano Zampini Mat_SeqAIJ *diag,*offd; 6562cf14000SStefano Zampini PetscInt *garray,i,noffd,dnnz,onnz,*row_starts,*col_starts; 657c1a070e6SStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 658613e5ff0Sstefano_zampini PetscBool ismpiaij,isseqaij; 6592cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 6606ea7df73SStefano Zampini HYPRE_Int *hdi = NULL,*hdj = NULL,*hoi = NULL,*hoj = NULL; 6615c97c10fSStefano Zampini PetscInt *pdi = NULL,*pdj = NULL,*poi = NULL,*poj = NULL; 6626ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 6636ea7df73SStefano Zampini PetscBool iscuda = PETSC_FALSE; 6646ea7df73SStefano Zampini #endif 665c1a070e6SStefano Zampini 666c1a070e6SStefano Zampini PetscFunctionBegin; 6679566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&ismpiaij)); 6689566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&isseqaij)); 66908401ef6SPierre Jolivet PetscCheck(ismpiaij || isseqaij,comm,PETSC_ERR_SUP,"Unsupported type %s",((PetscObject)A)->type_name); 670c1a070e6SStefano Zampini if (ismpiaij) { 671c1a070e6SStefano Zampini Mat_MPIAIJ *a = (Mat_MPIAIJ*)(A->data); 672c1a070e6SStefano Zampini 673c1a070e6SStefano Zampini diag = (Mat_SeqAIJ*)a->A->data; 674c1a070e6SStefano Zampini offd = (Mat_SeqAIJ*)a->B->data; 6756ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) && defined(HYPRE_USING_CUDA) 6769566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A,MATMPIAIJCUSPARSE,&iscuda)); 6776ea7df73SStefano Zampini if (iscuda && !A->boundtocpu) { 6786ea7df73SStefano Zampini sameint = PETSC_TRUE; 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->A,PETSC_FALSE,(const HYPRE_Int**)&hdi,(const HYPRE_Int**)&hdj)); 6809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->B,PETSC_FALSE,(const HYPRE_Int**)&hoi,(const HYPRE_Int**)&hoj)); 6816ea7df73SStefano Zampini } else { 6826ea7df73SStefano Zampini #else 6836ea7df73SStefano Zampini { 6846ea7df73SStefano Zampini #endif 6856ea7df73SStefano Zampini pdi = diag->i; 6866ea7df73SStefano Zampini pdj = diag->j; 6876ea7df73SStefano Zampini poi = offd->i; 6886ea7df73SStefano Zampini poj = offd->j; 6896ea7df73SStefano Zampini if (sameint) { 6906ea7df73SStefano Zampini hdi = (HYPRE_Int*)pdi; 6916ea7df73SStefano Zampini hdj = (HYPRE_Int*)pdj; 6926ea7df73SStefano Zampini hoi = (HYPRE_Int*)poi; 6936ea7df73SStefano Zampini hoj = (HYPRE_Int*)poj; 6946ea7df73SStefano Zampini } 6956ea7df73SStefano Zampini } 696c1a070e6SStefano Zampini garray = a->garray; 697c1a070e6SStefano Zampini noffd = a->B->cmap->N; 698c1a070e6SStefano Zampini dnnz = diag->nz; 699c1a070e6SStefano Zampini onnz = offd->nz; 700c1a070e6SStefano Zampini } else { 701c1a070e6SStefano Zampini diag = (Mat_SeqAIJ*)A->data; 702c1a070e6SStefano Zampini offd = NULL; 7036ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) 7049566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A,MATSEQAIJCUSPARSE,&iscuda)); 7056ea7df73SStefano Zampini if (iscuda && !A->boundtocpu) { 7066ea7df73SStefano Zampini sameint = PETSC_TRUE; 7079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(A,PETSC_FALSE,(const HYPRE_Int**)&hdi,(const HYPRE_Int**)&hdj)); 7086ea7df73SStefano Zampini } else { 7096ea7df73SStefano Zampini #else 7106ea7df73SStefano Zampini { 7116ea7df73SStefano Zampini #endif 7126ea7df73SStefano Zampini pdi = diag->i; 7136ea7df73SStefano Zampini pdj = diag->j; 7146ea7df73SStefano Zampini if (sameint) { 7156ea7df73SStefano Zampini hdi = (HYPRE_Int*)pdi; 7166ea7df73SStefano Zampini hdj = (HYPRE_Int*)pdj; 7176ea7df73SStefano Zampini } 7186ea7df73SStefano Zampini } 719c1a070e6SStefano Zampini garray = NULL; 720c1a070e6SStefano Zampini noffd = 0; 721c1a070e6SStefano Zampini dnnz = diag->nz; 722c1a070e6SStefano Zampini onnz = 0; 723c1a070e6SStefano Zampini } 724225daaf8SStefano Zampini 725c1a070e6SStefano Zampini /* create a temporary ParCSR */ 726c1a070e6SStefano Zampini if (HYPRE_AssumedPartitionCheck()) { 727c1a070e6SStefano Zampini PetscMPIInt myid; 728c1a070e6SStefano Zampini 7299566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm,&myid)); 730c1a070e6SStefano Zampini row_starts = A->rmap->range + myid; 731c1a070e6SStefano Zampini col_starts = A->cmap->range + myid; 732c1a070e6SStefano Zampini } else { 733c1a070e6SStefano Zampini row_starts = A->rmap->range; 734c1a070e6SStefano Zampini col_starts = A->cmap->range; 735c1a070e6SStefano Zampini } 7362cf14000SStefano Zampini tA = hypre_ParCSRMatrixCreate(comm,A->rmap->N,A->cmap->N,(HYPRE_BigInt*)row_starts,(HYPRE_BigInt*)col_starts,noffd,dnnz,onnz); 737a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 738c1a070e6SStefano Zampini hypre_ParCSRMatrixSetRowStartsOwner(tA,0); 739c1a070e6SStefano Zampini hypre_ParCSRMatrixSetColStartsOwner(tA,0); 740a1d2239cSSatish Balay #endif 741c1a070e6SStefano Zampini 742225daaf8SStefano Zampini /* set diagonal part */ 743c1a070e6SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(tA); 7446ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 7459566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n+1,&hdi,dnnz,&hdj)); 7466ea7df73SStefano Zampini for (i = 0; i < A->rmap->n+1; i++) hdi[i] = (HYPRE_Int)(pdi[i]); 7476ea7df73SStefano Zampini for (i = 0; i < dnnz; i++) hdj[i] = (HYPRE_Int)(pdj[i]); 7482cf14000SStefano Zampini } 7496ea7df73SStefano Zampini hypre_CSRMatrixI(hdiag) = hdi; 7506ea7df73SStefano Zampini hypre_CSRMatrixJ(hdiag) = hdj; 75139accc25SStefano Zampini hypre_CSRMatrixData(hdiag) = (HYPRE_Complex*)diag->a; 752c1a070e6SStefano Zampini hypre_CSRMatrixNumNonzeros(hdiag) = diag->nz; 753c1a070e6SStefano Zampini hypre_CSRMatrixSetRownnz(hdiag); 754c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hdiag,0); 755c1a070e6SStefano Zampini 756225daaf8SStefano Zampini /* set offdiagonal part */ 757c1a070e6SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(tA); 758c1a070e6SStefano Zampini if (offd) { 7596ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 7609566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n+1,&hoi,onnz,&hoj)); 7616ea7df73SStefano Zampini for (i = 0; i < A->rmap->n+1; i++) hoi[i] = (HYPRE_Int)(poi[i]); 7626ea7df73SStefano Zampini for (i = 0; i < onnz; i++) hoj[i] = (HYPRE_Int)(poj[i]); 7632cf14000SStefano Zampini } 7646ea7df73SStefano Zampini hypre_CSRMatrixI(hoffd) = hoi; 7656ea7df73SStefano Zampini hypre_CSRMatrixJ(hoffd) = hoj; 76639accc25SStefano Zampini hypre_CSRMatrixData(hoffd) = (HYPRE_Complex*)offd->a; 767c1a070e6SStefano Zampini hypre_CSRMatrixNumNonzeros(hoffd) = offd->nz; 768c1a070e6SStefano Zampini hypre_CSRMatrixSetRownnz(hoffd); 769c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hoffd,0); 7706ea7df73SStefano Zampini } 7716ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 772792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize_v2,tA,iscuda ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST); 7736ea7df73SStefano Zampini #else 7746ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0) 775792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize,tA); 7766ea7df73SStefano Zampini #else 777792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixInitialize_v2,tA,HYPRE_MEMORY_HOST); 7786ea7df73SStefano Zampini #endif 7796ea7df73SStefano Zampini #endif 7806ea7df73SStefano Zampini hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA),HYPRE_MEMORY_HOST); 781c1a070e6SStefano Zampini hypre_ParCSRMatrixSetNumNonzeros(tA); 7822cf14000SStefano Zampini hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt*)garray; 783792fecdfSBarry Smith if (!hypre_ParCSRMatrixCommPkg(tA)) PetscCallExternal(hypre_MatvecCommPkgCreate,tA); 784613e5ff0Sstefano_zampini *hA = tA; 785613e5ff0Sstefano_zampini PetscFunctionReturn(0); 786613e5ff0Sstefano_zampini } 787c1a070e6SStefano Zampini 788613e5ff0Sstefano_zampini static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 789613e5ff0Sstefano_zampini { 790613e5ff0Sstefano_zampini hypre_CSRMatrix *hdiag,*hoffd; 7916ea7df73SStefano Zampini PetscBool ismpiaij,sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 7926ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 7936ea7df73SStefano Zampini PetscBool iscuda = PETSC_FALSE; 7946ea7df73SStefano Zampini #endif 795c1a070e6SStefano Zampini 796613e5ff0Sstefano_zampini PetscFunctionBegin; 7979566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&ismpiaij)); 7986ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 7999566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)A,&iscuda,MATSEQAIJCUSPARSE,MATMPIAIJCUSPARSE,"")); 8006ea7df73SStefano Zampini if (iscuda) sameint = PETSC_TRUE; 8016ea7df73SStefano Zampini #endif 802613e5ff0Sstefano_zampini hdiag = hypre_ParCSRMatrixDiag(*hA); 803613e5ff0Sstefano_zampini hoffd = hypre_ParCSRMatrixOffd(*hA); 8046ea7df73SStefano Zampini /* free temporary memory allocated by PETSc 8056ea7df73SStefano Zampini set pointers to NULL before destroying tA */ 8062cf14000SStefano Zampini if (!sameint) { 8072cf14000SStefano Zampini HYPRE_Int *hi,*hj; 8082cf14000SStefano Zampini 8092cf14000SStefano Zampini hi = hypre_CSRMatrixI(hdiag); 8102cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hdiag); 8119566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi,hj)); 8126ea7df73SStefano Zampini if (ismpiaij) { 8132cf14000SStefano Zampini hi = hypre_CSRMatrixI(hoffd); 8142cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hoffd); 8159566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi,hj)); 8162cf14000SStefano Zampini } 8172cf14000SStefano Zampini } 818c1a070e6SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 819c1a070e6SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 820c1a070e6SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 8216ea7df73SStefano Zampini if (ismpiaij) { 822c1a070e6SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 823c1a070e6SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 824c1a070e6SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 8256ea7df73SStefano Zampini } 826613e5ff0Sstefano_zampini hypre_ParCSRMatrixColMapOffd(*hA) = NULL; 827613e5ff0Sstefano_zampini hypre_ParCSRMatrixDestroy(*hA); 828613e5ff0Sstefano_zampini *hA = NULL; 829613e5ff0Sstefano_zampini PetscFunctionReturn(0); 830613e5ff0Sstefano_zampini } 831613e5ff0Sstefano_zampini 832613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG: 8333dad0653Sstefano_zampini the resulting ParCSR will not own the column and row starts 8346ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 835a055b5aaSBarry Smith static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA,hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP) 836613e5ff0Sstefano_zampini { 837a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 838613e5ff0Sstefano_zampini HYPRE_Int P_owns_col_starts,R_owns_row_starts; 839a1d2239cSSatish Balay #endif 840613e5ff0Sstefano_zampini 841613e5ff0Sstefano_zampini PetscFunctionBegin; 842a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 843613e5ff0Sstefano_zampini P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP); 844613e5ff0Sstefano_zampini R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR); 845a1d2239cSSatish Balay #endif 8466ea7df73SStefano Zampini /* can be replaced by version test later */ 8476ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 848792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatrixRAP"); 8496ea7df73SStefano Zampini *hRAP = hypre_ParCSRMatrixRAP(hR,hA,hP); 8506ea7df73SStefano Zampini PetscStackPop; 8516ea7df73SStefano Zampini #else 852792fecdfSBarry Smith PetscCallExternal(hypre_BoomerAMGBuildCoarseOperator,hR,hA,hP,hRAP); 853792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixSetNumNonzeros,*hRAP); 8546ea7df73SStefano Zampini #endif 855613e5ff0Sstefano_zampini /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */ 856a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 857613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetRowStartsOwner(*hRAP,0); 858613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetColStartsOwner(*hRAP,0); 859613e5ff0Sstefano_zampini if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP,1); 860613e5ff0Sstefano_zampini if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR,1); 861a1d2239cSSatish Balay #endif 862613e5ff0Sstefano_zampini PetscFunctionReturn(0); 863613e5ff0Sstefano_zampini } 864613e5ff0Sstefano_zampini 8656f231fbdSstefano_zampini static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A,Mat P,Mat C) 866613e5ff0Sstefano_zampini { 8676f231fbdSstefano_zampini Mat B; 8686abb4441SStefano Zampini hypre_ParCSRMatrix *hA,*hP,*hPtAP = NULL; 8694222ddf1SHong Zhang Mat_Product *product=C->product; 870613e5ff0Sstefano_zampini 871613e5ff0Sstefano_zampini PetscFunctionBegin; 8729566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A,&hA)); 8739566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(P,&hP)); 8749566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hP,hA,hP,&hPtAP)); 8759566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hPtAP,MATAIJ,PETSC_OWN_POINTER,&B)); 8764222ddf1SHong Zhang 8779566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C,&B)); 8784222ddf1SHong Zhang C->product = product; 8794222ddf1SHong Zhang 8809566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A,&hA)); 8819566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(P,&hP)); 8826f231fbdSstefano_zampini PetscFunctionReturn(0); 8836f231fbdSstefano_zampini } 8846f231fbdSstefano_zampini 8854222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A,Mat P,PetscReal fill,Mat C) 8866f231fbdSstefano_zampini { 8876f231fbdSstefano_zampini PetscFunctionBegin; 8889566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATAIJ)); 8894222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_AIJ_wHYPRE; 8904222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 891613e5ff0Sstefano_zampini PetscFunctionReturn(0); 892613e5ff0Sstefano_zampini } 893613e5ff0Sstefano_zampini 8944cc28894Sstefano_zampini static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A,Mat P,Mat C) 895613e5ff0Sstefano_zampini { 8964cc28894Sstefano_zampini Mat B; 8974cc28894Sstefano_zampini Mat_HYPRE *hP; 8986abb4441SStefano Zampini hypre_ParCSRMatrix *hA = NULL,*Pparcsr,*ptapparcsr = NULL; 899613e5ff0Sstefano_zampini HYPRE_Int type; 900613e5ff0Sstefano_zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 9014cc28894Sstefano_zampini PetscBool ishypre; 902613e5ff0Sstefano_zampini 903613e5ff0Sstefano_zampini PetscFunctionBegin; 9049566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P,MATHYPRE,&ishypre)); 90528b400f6SJacob Faibussowitsch PetscCheck(ishypre,comm,PETSC_ERR_USER,"P should be of type %s",MATHYPRE); 9064cc28894Sstefano_zampini hP = (Mat_HYPRE*)P->data; 907792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,hP->ij,&type); 90808401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 909792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hP->ij,(void**)&Pparcsr); 910613e5ff0Sstefano_zampini 9119566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A,&hA)); 9129566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr,hA,Pparcsr,&ptapparcsr)); 9139566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A,&hA)); 914225daaf8SStefano Zampini 9154cc28894Sstefano_zampini /* create temporary matrix and merge to C */ 9169566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr,((PetscObject)C)->type_name,PETSC_OWN_POINTER,&B)); 9179566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C,&B)); 9184cc28894Sstefano_zampini PetscFunctionReturn(0); 9194cc28894Sstefano_zampini } 9204cc28894Sstefano_zampini 9214cc28894Sstefano_zampini static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A,Mat P,Mat C) 9224cc28894Sstefano_zampini { 9234cc28894Sstefano_zampini Mat B; 9246abb4441SStefano Zampini hypre_ParCSRMatrix *Aparcsr,*Pparcsr,*ptapparcsr = NULL; 9254cc28894Sstefano_zampini Mat_HYPRE *hA,*hP; 9264cc28894Sstefano_zampini PetscBool ishypre; 9274cc28894Sstefano_zampini HYPRE_Int type; 9284cc28894Sstefano_zampini 9294cc28894Sstefano_zampini PetscFunctionBegin; 9309566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P,MATHYPRE,&ishypre)); 93128b400f6SJacob Faibussowitsch PetscCheck(ishypre,PetscObjectComm((PetscObject)P),PETSC_ERR_USER,"P should be of type %s",MATHYPRE); 9329566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&ishypre)); 93328b400f6SJacob Faibussowitsch PetscCheck(ishypre,PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"A should be of type %s",MATHYPRE); 9344cc28894Sstefano_zampini hA = (Mat_HYPRE*)A->data; 9354cc28894Sstefano_zampini hP = (Mat_HYPRE*)P->data; 936792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,hA->ij,&type); 93708401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 938792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,hP->ij,&type); 93908401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,PetscObjectComm((PetscObject)P),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 940792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&Aparcsr); 941792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hP->ij,(void**)&Pparcsr); 9429566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr,Aparcsr,Pparcsr,&ptapparcsr)); 9439566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr,MATHYPRE,PETSC_OWN_POINTER,&B)); 9449566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C,&B)); 9454cc28894Sstefano_zampini PetscFunctionReturn(0); 9464cc28894Sstefano_zampini } 9474cc28894Sstefano_zampini 948d501dc42Sstefano_zampini /* calls hypre_ParMatmul 949d501dc42Sstefano_zampini hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA 9503dad0653Sstefano_zampini hypre_ParMatrixCreate does not duplicate the communicator 9516ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 952d501dc42Sstefano_zampini static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB) 953d501dc42Sstefano_zampini { 954d501dc42Sstefano_zampini PetscFunctionBegin; 9556ea7df73SStefano Zampini /* can be replaced by version test later */ 9566ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 957792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatMat"); 9586ea7df73SStefano Zampini *hAB = hypre_ParCSRMatMat(hA,hB); 9596ea7df73SStefano Zampini #else 960792fecdfSBarry Smith PetscStackPushExternal("hypre_ParMatmul"); 961d501dc42Sstefano_zampini *hAB = hypre_ParMatmul(hA,hB); 9626ea7df73SStefano Zampini #endif 963d501dc42Sstefano_zampini PetscStackPop; 964d501dc42Sstefano_zampini PetscFunctionReturn(0); 965d501dc42Sstefano_zampini } 966d501dc42Sstefano_zampini 9675e5acdf2Sstefano_zampini static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C) 9685e5acdf2Sstefano_zampini { 9695e5acdf2Sstefano_zampini Mat D; 970d501dc42Sstefano_zampini hypre_ParCSRMatrix *hA,*hB,*hAB = NULL; 9714222ddf1SHong Zhang Mat_Product *product=C->product; 9725e5acdf2Sstefano_zampini 9735e5acdf2Sstefano_zampini PetscFunctionBegin; 9749566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A,&hA)); 9759566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B,&hB)); 9769566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(hA,hB,&hAB)); 9779566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hAB,MATAIJ,PETSC_OWN_POINTER,&D)); 9784222ddf1SHong Zhang 9799566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C,&D)); 9804222ddf1SHong Zhang C->product = product; 9814222ddf1SHong Zhang 9829566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A,&hA)); 9839566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B,&hB)); 9845e5acdf2Sstefano_zampini PetscFunctionReturn(0); 9855e5acdf2Sstefano_zampini } 9865e5acdf2Sstefano_zampini 9874222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A,Mat B,PetscReal fill,Mat C) 9885e5acdf2Sstefano_zampini { 9895e5acdf2Sstefano_zampini PetscFunctionBegin; 9909566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATAIJ)); 9914222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE; 9924222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 9935e5acdf2Sstefano_zampini PetscFunctionReturn(0); 9945e5acdf2Sstefano_zampini } 9955e5acdf2Sstefano_zampini 996d501dc42Sstefano_zampini static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A,Mat B,Mat C) 997d501dc42Sstefano_zampini { 998d501dc42Sstefano_zampini Mat D; 999d501dc42Sstefano_zampini hypre_ParCSRMatrix *Aparcsr,*Bparcsr,*ABparcsr = NULL; 1000d501dc42Sstefano_zampini Mat_HYPRE *hA,*hB; 1001d501dc42Sstefano_zampini PetscBool ishypre; 1002d501dc42Sstefano_zampini HYPRE_Int type; 10034222ddf1SHong Zhang Mat_Product *product; 1004d501dc42Sstefano_zampini 1005d501dc42Sstefano_zampini PetscFunctionBegin; 10069566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B,MATHYPRE,&ishypre)); 100728b400f6SJacob Faibussowitsch PetscCheck(ishypre,PetscObjectComm((PetscObject)B),PETSC_ERR_USER,"B should be of type %s",MATHYPRE); 10089566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&ishypre)); 100928b400f6SJacob Faibussowitsch PetscCheck(ishypre,PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"A should be of type %s",MATHYPRE); 1010d501dc42Sstefano_zampini hA = (Mat_HYPRE*)A->data; 1011d501dc42Sstefano_zampini hB = (Mat_HYPRE*)B->data; 1012792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,hA->ij,&type); 101308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 1014792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,hB->ij,&type); 101508401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,PetscObjectComm((PetscObject)B),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 1016792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&Aparcsr); 1017792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hB->ij,(void**)&Bparcsr); 10189566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(Aparcsr,Bparcsr,&ABparcsr)); 10199566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ABparcsr,MATHYPRE,PETSC_OWN_POINTER,&D)); 10204222ddf1SHong Zhang 1021d501dc42Sstefano_zampini /* need to use HeaderReplace because HeaderMerge messes up with the communicator */ 10224222ddf1SHong Zhang product = C->product; /* save it from MatHeaderReplace() */ 10234222ddf1SHong Zhang C->product = NULL; 10249566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(C,&D)); 10254222ddf1SHong Zhang C->product = product; 1026d501dc42Sstefano_zampini C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 10274222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 1028d501dc42Sstefano_zampini PetscFunctionReturn(0); 1029d501dc42Sstefano_zampini } 1030d501dc42Sstefano_zampini 10313dad0653Sstefano_zampini PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C,Mat D) 103220e1dc0dSstefano_zampini { 103320e1dc0dSstefano_zampini Mat E; 10346abb4441SStefano Zampini hypre_ParCSRMatrix *hA,*hB,*hC,*hABC = NULL; 103520e1dc0dSstefano_zampini 103620e1dc0dSstefano_zampini PetscFunctionBegin; 10379566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A,&hA)); 10389566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B,&hB)); 10399566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(C,&hC)); 10409566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hA,hB,hC,&hABC)); 10419566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hABC,MATAIJ,PETSC_OWN_POINTER,&E)); 10429566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(D,&E)); 10439566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A,&hA)); 10449566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B,&hB)); 10459566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(C,&hC)); 104620e1dc0dSstefano_zampini PetscFunctionReturn(0); 104720e1dc0dSstefano_zampini } 104820e1dc0dSstefano_zampini 10494222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C,PetscReal fill,Mat D) 105020e1dc0dSstefano_zampini { 105120e1dc0dSstefano_zampini PetscFunctionBegin; 10529566063dSJacob Faibussowitsch PetscCall(MatSetType(D,MATAIJ)); 105320e1dc0dSstefano_zampini PetscFunctionReturn(0); 105420e1dc0dSstefano_zampini } 105520e1dc0dSstefano_zampini 10564222ddf1SHong Zhang /* ---------------------------------------------------- */ 10574222ddf1SHong Zhang static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C) 10584222ddf1SHong Zhang { 10594222ddf1SHong Zhang PetscFunctionBegin; 10604222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 10614222ddf1SHong Zhang PetscFunctionReturn(0); 10624222ddf1SHong Zhang } 10634222ddf1SHong Zhang 10644222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C) 10654222ddf1SHong Zhang { 10664222ddf1SHong Zhang Mat_Product *product = C->product; 10674222ddf1SHong Zhang PetscBool Ahypre; 10684222ddf1SHong Zhang 10694222ddf1SHong Zhang PetscFunctionBegin; 10709566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)product->A,MATHYPRE,&Ahypre)); 10714222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 10729566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATHYPRE)); 10734222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE; 10744222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 10754222ddf1SHong Zhang PetscFunctionReturn(0); 10766718818eSStefano Zampini } 10774222ddf1SHong Zhang PetscFunctionReturn(0); 10784222ddf1SHong Zhang } 10794222ddf1SHong Zhang 10804222ddf1SHong Zhang static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C) 10814222ddf1SHong Zhang { 10824222ddf1SHong Zhang PetscFunctionBegin; 10834222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 10844222ddf1SHong Zhang PetscFunctionReturn(0); 10854222ddf1SHong Zhang } 10864222ddf1SHong Zhang 10874222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C) 10884222ddf1SHong Zhang { 10894222ddf1SHong Zhang Mat_Product *product = C->product; 10904222ddf1SHong Zhang PetscBool flg; 10914222ddf1SHong Zhang PetscInt type = 0; 10924222ddf1SHong Zhang const char *outTypes[4] = {"aij","seqaij","mpiaij","hypre"}; 10934222ddf1SHong Zhang PetscInt ntype = 4; 10944222ddf1SHong Zhang Mat A = product->A; 10954222ddf1SHong Zhang PetscBool Ahypre; 10964222ddf1SHong Zhang 10974222ddf1SHong Zhang PetscFunctionBegin; 10989566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&Ahypre)); 10994222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 11009566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATHYPRE)); 11014222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 11024222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_HYPRE_HYPRE; 11034222ddf1SHong Zhang PetscFunctionReturn(0); 11044222ddf1SHong Zhang } 11054222ddf1SHong Zhang 11064222ddf1SHong Zhang /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */ 11074222ddf1SHong Zhang /* Get runtime option */ 11084222ddf1SHong Zhang if (product->api_user) { 1109d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C),((PetscObject)C)->prefix,"MatPtAP_HYPRE","Mat"); 11109566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-matptap_hypre_outtype","MatPtAP outtype","MatPtAP outtype",outTypes,ntype,outTypes[type],&type,&flg)); 1111d0609cedSBarry Smith PetscOptionsEnd(); 11124222ddf1SHong Zhang } else { 1113d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C),((PetscObject)C)->prefix,"MatProduct_PtAP_HYPRE","Mat"); 11149566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-mat_product_algorithm_hypre_outtype","MatProduct_PtAP outtype","MatProduct_PtAP",outTypes,ntype,outTypes[type],&type,&flg)); 1115d0609cedSBarry Smith PetscOptionsEnd(); 11164222ddf1SHong Zhang } 11174222ddf1SHong Zhang 11184222ddf1SHong Zhang if (type == 0 || type == 1 || type == 2) { 11199566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATAIJ)); 11204222ddf1SHong Zhang } else if (type == 3) { 11219566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATHYPRE)); 11224222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_SUP,"MatPtAP outtype is not supported"); 11234222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 11244222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_HYPRE; 11254222ddf1SHong Zhang PetscFunctionReturn(0); 11264222ddf1SHong Zhang } 11274222ddf1SHong Zhang 11284222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C) 11294222ddf1SHong Zhang { 11304222ddf1SHong Zhang Mat_Product *product = C->product; 11314222ddf1SHong Zhang 11324222ddf1SHong Zhang PetscFunctionBegin; 11334222ddf1SHong Zhang switch (product->type) { 11344222ddf1SHong Zhang case MATPRODUCT_AB: 11359566063dSJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_AB(C)); 11364222ddf1SHong Zhang break; 11374222ddf1SHong Zhang case MATPRODUCT_PtAP: 11389566063dSJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_PtAP(C)); 11394222ddf1SHong Zhang break; 11406718818eSStefano Zampini default: 11416718818eSStefano Zampini break; 11424222ddf1SHong Zhang } 11434222ddf1SHong Zhang PetscFunctionReturn(0); 11444222ddf1SHong Zhang } 11454222ddf1SHong Zhang 11464222ddf1SHong Zhang /* -------------------------------------------------------- */ 11474222ddf1SHong Zhang 1148ea9daf28SStefano Zampini static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y) 114963c07aadSStefano Zampini { 115063c07aadSStefano Zampini PetscFunctionBegin; 11519566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A,1.0,x,0.0,y,PETSC_TRUE)); 115263c07aadSStefano Zampini PetscFunctionReturn(0); 115363c07aadSStefano Zampini } 115463c07aadSStefano Zampini 1155ea9daf28SStefano Zampini static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y) 115663c07aadSStefano Zampini { 115763c07aadSStefano Zampini PetscFunctionBegin; 11589566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A,1.0,x,0.0,y,PETSC_FALSE)); 115963c07aadSStefano Zampini PetscFunctionReturn(0); 116063c07aadSStefano Zampini } 116163c07aadSStefano Zampini 1162414bd5c3SStefano Zampini static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1163414bd5c3SStefano Zampini { 1164414bd5c3SStefano Zampini PetscFunctionBegin; 1165414bd5c3SStefano Zampini if (y != z) { 11669566063dSJacob Faibussowitsch PetscCall(VecCopy(y,z)); 1167414bd5c3SStefano Zampini } 11689566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A,1.0,x,1.0,z,PETSC_FALSE)); 1169414bd5c3SStefano Zampini PetscFunctionReturn(0); 1170414bd5c3SStefano Zampini } 1171414bd5c3SStefano Zampini 1172414bd5c3SStefano Zampini static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1173414bd5c3SStefano Zampini { 1174414bd5c3SStefano Zampini PetscFunctionBegin; 1175414bd5c3SStefano Zampini if (y != z) { 11769566063dSJacob Faibussowitsch PetscCall(VecCopy(y,z)); 1177414bd5c3SStefano Zampini } 11789566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A,1.0,x,1.0,z,PETSC_TRUE)); 1179414bd5c3SStefano Zampini PetscFunctionReturn(0); 1180414bd5c3SStefano Zampini } 1181414bd5c3SStefano Zampini 1182414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */ 118339accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans) 118463c07aadSStefano Zampini { 118563c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 118663c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 118763c07aadSStefano Zampini hypre_ParVector *hx,*hy; 118863c07aadSStefano Zampini 118963c07aadSStefano Zampini PetscFunctionBegin; 119063c07aadSStefano Zampini if (trans) { 11919566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->b,x)); 11929566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->x,y)); 11939566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->x,y)); 1194792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject,hA->b->ij,(void**)&hx); 1195792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject,hA->x->ij,(void**)&hy); 119663c07aadSStefano Zampini } else { 11979566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->x,x)); 11989566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->b,y)); 11999566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->b,y)); 1200792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject,hA->x->ij,(void**)&hx); 1201792fecdfSBarry Smith PetscCallExternal(HYPRE_IJVectorGetObject,hA->b->ij,(void**)&hy); 120263c07aadSStefano Zampini } 1203792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 12046ea7df73SStefano Zampini if (trans) { 1205792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMatvecT,a,parcsr,hx,b,hy); 12066ea7df73SStefano Zampini } else { 1207792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMatvec,a,parcsr,hx,b,hy); 12086ea7df73SStefano Zampini } 12099566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->x)); 12109566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->b)); 121163c07aadSStefano Zampini PetscFunctionReturn(0); 121263c07aadSStefano Zampini } 121363c07aadSStefano Zampini 1214ea9daf28SStefano Zampini static PetscErrorCode MatDestroy_HYPRE(Mat A) 121563c07aadSStefano Zampini { 121663c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 121763c07aadSStefano Zampini 121863c07aadSStefano Zampini PetscFunctionBegin; 12199566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->x)); 12209566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->b)); 1221978814f1SStefano Zampini if (hA->ij) { 1222978814f1SStefano Zampini if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL; 1223792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixDestroy,hA->ij); 1224978814f1SStefano Zampini } 12259566063dSJacob Faibussowitsch if (hA->comm) PetscCall(PetscCommRestoreComm(PetscObjectComm((PetscObject)A),&hA->comm)); 1226c69f721fSFande Kong 12279566063dSJacob Faibussowitsch PetscCall(MatStashDestroy_Private(&A->stash)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array)); 1229c69f721fSFande Kong 12305fbaff96SJunchao Zhang if (hA->cooMat) { 12315fbaff96SJunchao Zhang PetscCall(MatDestroy(&hA->cooMat)); 1232*e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree",hypre_TFree(hA->diagJ,hA->memType)); 1233*e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree",hypre_TFree(hA->offdJ,hA->memType)); 1234*e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree",hypre_TFree(hA->diag,hA->memType)); 12355fbaff96SJunchao Zhang } 12365fbaff96SJunchao Zhang 12379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_hypre_aij_C",NULL)); 12389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_hypre_is_C",NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_hypre_C",NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_mpiaij_hypre_C",NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatHYPRESetPreallocation_C",NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatHYPREGetParCSR_C",NULL)); 12435fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetPreallocationCOO_C",NULL)); 12445fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetValuesCOO_C",NULL)); 12459566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 124663c07aadSStefano Zampini PetscFunctionReturn(0); 124763c07aadSStefano Zampini } 124863c07aadSStefano Zampini 1249ea9daf28SStefano Zampini static PetscErrorCode MatSetUp_HYPRE(Mat A) 125063c07aadSStefano Zampini { 12514ec6421dSstefano_zampini PetscFunctionBegin; 12529566063dSJacob Faibussowitsch PetscCall(MatHYPRESetPreallocation(A,PETSC_DEFAULT,NULL,PETSC_DEFAULT,NULL)); 12534ec6421dSstefano_zampini PetscFunctionReturn(0); 12544ec6421dSstefano_zampini } 12554ec6421dSstefano_zampini 12566ea7df73SStefano Zampini //TODO FIX hypre_CSRMatrixMatvecOutOfPlace 12576ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 12586ea7df73SStefano Zampini static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind) 12596ea7df73SStefano Zampini { 12606ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 12616ea7df73SStefano Zampini HYPRE_MemoryLocation hmem = bind ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE; 12626ea7df73SStefano Zampini 12636ea7df73SStefano Zampini PetscFunctionBegin; 12646ea7df73SStefano Zampini A->boundtocpu = bind; 12655fbaff96SJunchao Zhang if (hA->ij && hypre_IJMatrixAssembleFlag(hA->ij) && hmem != hypre_IJMatrixMemoryLocation(hA->ij)) { 12666ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 1267792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 1268792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMigrate,parcsr, hmem); 12696ea7df73SStefano Zampini } 12709566063dSJacob Faibussowitsch if (hA->x) PetscCall(VecHYPRE_IJBindToCPU(hA->x,bind)); 12719566063dSJacob Faibussowitsch if (hA->b) PetscCall(VecHYPRE_IJBindToCPU(hA->b,bind)); 12726ea7df73SStefano Zampini PetscFunctionReturn(0); 12736ea7df73SStefano Zampini } 12746ea7df73SStefano Zampini #endif 12756ea7df73SStefano Zampini 12764ec6421dSstefano_zampini static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode) 12774ec6421dSstefano_zampini { 127863c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1279c69f721fSFande Kong PetscMPIInt n; 1280c69f721fSFande Kong PetscInt i,j,rstart,ncols,flg; 1281c69f721fSFande Kong PetscInt *row,*col; 1282c69f721fSFande Kong PetscScalar *val; 128363c07aadSStefano Zampini 128463c07aadSStefano Zampini PetscFunctionBegin; 128508401ef6SPierre Jolivet PetscCheck(mode != MAT_FLUSH_ASSEMBLY,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE"); 1286c69f721fSFande Kong 1287c69f721fSFande Kong if (!A->nooffprocentries) { 1288c69f721fSFande Kong while (1) { 12899566063dSJacob Faibussowitsch PetscCall(MatStashScatterGetMesg_Private(&A->stash,&n,&row,&col,&val,&flg)); 1290c69f721fSFande Kong if (!flg) break; 1291c69f721fSFande Kong 1292c69f721fSFande Kong for (i=0; i<n;) { 1293c69f721fSFande Kong /* Now identify the consecutive vals belonging to the same row */ 1294c69f721fSFande Kong for (j=i,rstart=row[j]; j<n; j++) { 1295c69f721fSFande Kong if (row[j] != rstart) break; 1296c69f721fSFande Kong } 1297c69f721fSFande Kong if (j < n) ncols = j-i; 1298c69f721fSFande Kong else ncols = n-i; 1299c69f721fSFande Kong /* Now assemble all these values with a single function call */ 13009566063dSJacob Faibussowitsch PetscCall(MatSetValues_HYPRE(A,1,row+i,ncols,col+i,val+i,A->insertmode)); 1301c69f721fSFande Kong 1302c69f721fSFande Kong i = j; 1303c69f721fSFande Kong } 1304c69f721fSFande Kong } 13059566063dSJacob Faibussowitsch PetscCall(MatStashScatterEnd_Private(&A->stash)); 1306c69f721fSFande Kong } 1307c69f721fSFande Kong 1308792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixAssemble,hA->ij); 1309336664bdSPierre Jolivet /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */ 1310336664bdSPierre Jolivet /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */ 1311336664bdSPierre Jolivet if (!hA->sorted_full) { 1312af1cf968SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1313af1cf968SStefano Zampini 1314af1cf968SStefano Zampini /* call destroy just to make sure we do not leak anything */ 1315af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij); 1316792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixDestroy,aux_matrix); 1317af1cf968SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1318af1cf968SStefano Zampini 1319af1cf968SStefano Zampini /* Initialize with assembled flag -> it only recreates the aux_par_matrix */ 1320792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize,hA->ij); 1321af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij); 13226ea7df73SStefano Zampini if (aux_matrix) { 1323af1cf968SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see comment in MatHYPRESetPreallocation_HYPRE */ 132422235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 1325792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixInitialize,aux_matrix); 132622235d61SPierre Jolivet #else 1327792fecdfSBarry Smith PetscCallExternal(hypre_AuxParCSRMatrixInitialize_v2,aux_matrix,HYPRE_MEMORY_HOST); 132822235d61SPierre Jolivet #endif 1329af1cf968SStefano Zampini } 13306ea7df73SStefano Zampini } 13316ea7df73SStefano Zampini { 13326ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 13336ea7df73SStefano Zampini 1334792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 1335792fecdfSBarry Smith if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscCallExternal(hypre_MatvecCommPkgCreate,parcsr); 13366ea7df73SStefano Zampini } 13379566063dSJacob Faibussowitsch if (!hA->x) PetscCall(VecHYPRE_IJVectorCreate(A->cmap,&hA->x)); 13389566063dSJacob Faibussowitsch if (!hA->b) PetscCall(VecHYPRE_IJVectorCreate(A->rmap,&hA->b)); 13396ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 13409566063dSJacob Faibussowitsch PetscCall(MatBindToCPU_HYPRE(A,A->boundtocpu)); 13416ea7df73SStefano Zampini #endif 134263c07aadSStefano Zampini PetscFunctionReturn(0); 134363c07aadSStefano Zampini } 134463c07aadSStefano Zampini 1345c69f721fSFande Kong static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array) 1346c69f721fSFande Kong { 1347c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1348c69f721fSFande Kong 1349c69f721fSFande Kong PetscFunctionBegin; 135028b400f6SJacob Faibussowitsch PetscCheck(hA->available,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Temporary space is in use"); 1351c69f721fSFande Kong 135239accc25SStefano Zampini if (hA->size >= size) { 135339accc25SStefano Zampini *array = hA->array; 135439accc25SStefano Zampini } else { 13559566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array)); 1356c69f721fSFande Kong hA->size = size; 13579566063dSJacob Faibussowitsch PetscCall(PetscMalloc(hA->size,&hA->array)); 1358c69f721fSFande Kong *array = hA->array; 1359c69f721fSFande Kong } 1360c69f721fSFande Kong 1361c69f721fSFande Kong hA->available = PETSC_FALSE; 1362c69f721fSFande Kong PetscFunctionReturn(0); 1363c69f721fSFande Kong } 1364c69f721fSFande Kong 1365708542d2SFande Kong static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array) 1366c69f721fSFande Kong { 1367c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1368c69f721fSFande Kong 1369c69f721fSFande Kong PetscFunctionBegin; 1370c69f721fSFande Kong *array = NULL; 1371c69f721fSFande Kong hA->available = PETSC_TRUE; 1372c69f721fSFande Kong PetscFunctionReturn(0); 1373c69f721fSFande Kong } 1374c69f721fSFande Kong 13756ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins) 1376d975228cSstefano_zampini { 1377d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1378d975228cSstefano_zampini PetscScalar *vals = (PetscScalar *)v; 137939accc25SStefano Zampini HYPRE_Complex *sscr; 1380c69f721fSFande Kong PetscInt *cscr[2]; 1381c69f721fSFande Kong PetscInt i,nzc; 138208defe43SFande Kong void *array = NULL; 1383d975228cSstefano_zampini 1384d975228cSstefano_zampini PetscFunctionBegin; 13859566063dSJacob Faibussowitsch PetscCall(MatGetArray_HYPRE(A,sizeof(PetscInt)*(2*nc)+sizeof(HYPRE_Complex)*nc*nr,&array)); 1386c69f721fSFande Kong cscr[0] = (PetscInt*)array; 1387c69f721fSFande Kong cscr[1] = ((PetscInt*)array)+nc; 138839accc25SStefano Zampini sscr = (HYPRE_Complex*)(((PetscInt*)array)+nc*2); 1389d975228cSstefano_zampini for (i=0,nzc=0;i<nc;i++) { 1390d975228cSstefano_zampini if (cols[i] >= 0) { 1391d975228cSstefano_zampini cscr[0][nzc ] = cols[i]; 1392d975228cSstefano_zampini cscr[1][nzc++] = i; 1393d975228cSstefano_zampini } 1394d975228cSstefano_zampini } 1395c69f721fSFande Kong if (!nzc) { 13969566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A,&array)); 1397c69f721fSFande Kong PetscFunctionReturn(0); 1398c69f721fSFande Kong } 1399d975228cSstefano_zampini 14006ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE) 14016ea7df73SStefano Zampini if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) { 14026ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 14036ea7df73SStefano Zampini 1404792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 1405792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixMigrate,parcsr, HYPRE_MEMORY_HOST); 14066ea7df73SStefano Zampini } 14076ea7df73SStefano Zampini #endif 14086ea7df73SStefano Zampini 1409d975228cSstefano_zampini if (ins == ADD_VALUES) { 1410d975228cSstefano_zampini for (i=0;i<nr;i++) { 14116ea7df73SStefano Zampini if (rows[i] >= 0) { 1412d975228cSstefano_zampini PetscInt j; 14132cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 14142cf14000SStefano Zampini 1415aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,nzc,rows[i]); 14169566063dSJacob Faibussowitsch for (j=0;j<nzc;j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]],&sscr[j])); 1417792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixAddToValues,hA->ij,1,&hnc,(HYPRE_BigInt*)(rows+i),(HYPRE_BigInt*)cscr[0],sscr); 1418d975228cSstefano_zampini } 1419d975228cSstefano_zampini vals += nc; 1420d975228cSstefano_zampini } 1421d975228cSstefano_zampini } else { /* INSERT_VALUES */ 1422d975228cSstefano_zampini PetscInt rst,ren; 1423c69f721fSFande Kong 14249566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A,&rst,&ren)); 1425d975228cSstefano_zampini for (i=0;i<nr;i++) { 14266ea7df73SStefano Zampini if (rows[i] >= 0) { 1427d975228cSstefano_zampini PetscInt j; 14282cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 14292cf14000SStefano Zampini 1430aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,nzc,rows[i]); 14319566063dSJacob Faibussowitsch for (j=0;j<nzc;j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]],&sscr[j])); 1432c69f721fSFande Kong /* nonlocal values */ 14339566063dSJacob Faibussowitsch if (rows[i] < rst || rows[i] >= ren) PetscCall(MatStashValuesRow_Private(&A->stash,rows[i],nzc,cscr[0],(PetscScalar*)sscr,PETSC_FALSE)); 1434c69f721fSFande Kong /* local values */ 1435792fecdfSBarry Smith else PetscCallExternal(HYPRE_IJMatrixSetValues,hA->ij,1,&hnc,(HYPRE_BigInt*)(rows+i),(HYPRE_BigInt*)cscr[0],sscr); 1436d975228cSstefano_zampini } 1437d975228cSstefano_zampini vals += nc; 1438d975228cSstefano_zampini } 1439d975228cSstefano_zampini } 1440c69f721fSFande Kong 14419566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A,&array)); 1442d975228cSstefano_zampini PetscFunctionReturn(0); 1443d975228cSstefano_zampini } 1444d975228cSstefano_zampini 1445d975228cSstefano_zampini static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1446d975228cSstefano_zampini { 1447d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 14487d968826Sstefano_zampini HYPRE_Int *hdnnz,*honnz; 144906a29025Sstefano_zampini PetscInt i,rs,re,cs,ce,bs; 1450d975228cSstefano_zampini PetscMPIInt size; 1451d975228cSstefano_zampini 1452d975228cSstefano_zampini PetscFunctionBegin; 14539566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 14549566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 1455d975228cSstefano_zampini rs = A->rmap->rstart; 1456d975228cSstefano_zampini re = A->rmap->rend; 1457d975228cSstefano_zampini cs = A->cmap->rstart; 1458d975228cSstefano_zampini ce = A->cmap->rend; 1459d975228cSstefano_zampini if (!hA->ij) { 1460792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate,hA->comm,rs,re-1,cs,ce-1,&hA->ij); 1461792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR); 1462d975228cSstefano_zampini } else { 14632cf14000SStefano Zampini HYPRE_BigInt hrs,hre,hcs,hce; 1464792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetLocalRange,hA->ij,&hrs,&hre,&hcs,&hce); 1465aed4548fSBarry Smith PetscCheck(hre-hrs+1 == re -rs,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Inconsistent local rows: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")",hrs,hre+1,rs,re); 1466aed4548fSBarry Smith PetscCheck(hce-hcs+1 == ce -cs,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Inconsistent local cols: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")",hcs,hce+1,cs,ce); 1467d975228cSstefano_zampini } 14689566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A,&bs)); 146906a29025Sstefano_zampini if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10*bs; 147006a29025Sstefano_zampini if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10*bs; 147106a29025Sstefano_zampini 1472d975228cSstefano_zampini if (!dnnz) { 14739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&hdnnz)); 1474d975228cSstefano_zampini for (i=0;i<A->rmap->n;i++) hdnnz[i] = dnz; 1475d975228cSstefano_zampini } else { 14767d968826Sstefano_zampini hdnnz = (HYPRE_Int*)dnnz; 1477d975228cSstefano_zampini } 14789566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A),&size)); 1479d975228cSstefano_zampini if (size > 1) { 1480ddbeb582SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1481d975228cSstefano_zampini if (!onnz) { 14829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&honnz)); 1483d975228cSstefano_zampini for (i=0;i<A->rmap->n;i++) honnz[i] = onz; 148422235d61SPierre Jolivet } else honnz = (HYPRE_Int*)onnz; 1485ddbeb582SStefano Zampini /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems 1486ddbeb582SStefano Zampini they assume the user will input the entire row values, properly sorted 1487336664bdSPierre Jolivet In PETSc, we don't make such an assumption and set this flag to 1, 1488336664bdSPierre Jolivet unless the option MAT_SORTED_FULL is set to true. 1489ddbeb582SStefano Zampini Also, to avoid possible memory leaks, we destroy and recreate the translator 1490ddbeb582SStefano Zampini This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize 1491ddbeb582SStefano Zampini the IJ matrix for us */ 1492ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij); 1493ddbeb582SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 1494ddbeb582SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1495792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetDiagOffdSizes,hA->ij,hdnnz,honnz); 1496ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij); 1497336664bdSPierre Jolivet hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !hA->sorted_full; 1498d975228cSstefano_zampini } else { 1499d975228cSstefano_zampini honnz = NULL; 1500792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetRowSizes,hA->ij,hdnnz); 1501d975228cSstefano_zampini } 1502ddbeb582SStefano Zampini 1503af1cf968SStefano Zampini /* reset assembled flag and call the initialize method */ 1504af1cf968SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 0; 15056ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 1506792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize,hA->ij); 15076ea7df73SStefano Zampini #else 1508792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize_v2,hA->ij,HYPRE_MEMORY_HOST); 15096ea7df73SStefano Zampini #endif 1510d975228cSstefano_zampini if (!dnnz) { 15119566063dSJacob Faibussowitsch PetscCall(PetscFree(hdnnz)); 1512d975228cSstefano_zampini } 1513d975228cSstefano_zampini if (!onnz && honnz) { 15149566063dSJacob Faibussowitsch PetscCall(PetscFree(honnz)); 1515d975228cSstefano_zampini } 1516af1cf968SStefano Zampini /* Match AIJ logic */ 151706a29025Sstefano_zampini A->preallocated = PETSC_TRUE; 1518af1cf968SStefano Zampini A->assembled = PETSC_FALSE; 1519d975228cSstefano_zampini PetscFunctionReturn(0); 1520d975228cSstefano_zampini } 1521d975228cSstefano_zampini 1522d975228cSstefano_zampini /*@C 1523d975228cSstefano_zampini MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format 1524d975228cSstefano_zampini 1525d975228cSstefano_zampini Collective on Mat 1526d975228cSstefano_zampini 1527d975228cSstefano_zampini Input Parameters: 1528d975228cSstefano_zampini + A - the matrix 1529d975228cSstefano_zampini . dnz - number of nonzeros per row in DIAGONAL portion of local submatrix 1530d975228cSstefano_zampini (same value is used for all local rows) 1531d975228cSstefano_zampini . dnnz - array containing the number of nonzeros in the various rows of the 1532d975228cSstefano_zampini DIAGONAL portion of the local submatrix (possibly different for each row) 1533d975228cSstefano_zampini or NULL (PETSC_NULL_INTEGER in Fortran), if d_nz is used to specify the nonzero structure. 1534d975228cSstefano_zampini The size of this array is equal to the number of local rows, i.e 'm'. 1535d975228cSstefano_zampini For matrices that will be factored, you must leave room for (and set) 1536d975228cSstefano_zampini the diagonal entry even if it is zero. 1537d975228cSstefano_zampini . onz - number of nonzeros per row in the OFF-DIAGONAL portion of local 1538d975228cSstefano_zampini submatrix (same value is used for all local rows). 1539d975228cSstefano_zampini - onnz - array containing the number of nonzeros in the various rows of the 1540d975228cSstefano_zampini OFF-DIAGONAL portion of the local submatrix (possibly different for 1541d975228cSstefano_zampini each row) or NULL (PETSC_NULL_INTEGER in Fortran), if o_nz is used to specify the nonzero 1542d975228cSstefano_zampini structure. The size of this array is equal to the number 1543d975228cSstefano_zampini of local rows, i.e 'm'. 1544d975228cSstefano_zampini 154595452b02SPatrick Sanan Notes: 154695452b02SPatrick Sanan If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, onz and onnz are ignored. 1547d975228cSstefano_zampini 1548d975228cSstefano_zampini Level: intermediate 1549d975228cSstefano_zampini 1550db781477SPatrick Sanan .seealso: `MatCreate()`, `MatMPIAIJSetPreallocation()`, `MATHYPRE` 1551d975228cSstefano_zampini @*/ 1552d975228cSstefano_zampini PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1553d975228cSstefano_zampini { 1554d975228cSstefano_zampini PetscFunctionBegin; 1555d975228cSstefano_zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1556d975228cSstefano_zampini PetscValidType(A,1); 1557cac4c232SBarry Smith PetscTryMethod(A,"MatHYPRESetPreallocation_C",(Mat,PetscInt,const PetscInt[],PetscInt,const PetscInt[]),(A,dnz,dnnz,onz,onnz)); 1558d975228cSstefano_zampini PetscFunctionReturn(0); 1559d975228cSstefano_zampini } 1560d975228cSstefano_zampini 1561225daaf8SStefano Zampini /* 1562225daaf8SStefano Zampini MatCreateFromParCSR - Creates a matrix from a hypre_ParCSRMatrix 1563225daaf8SStefano Zampini 1564225daaf8SStefano Zampini Collective 1565225daaf8SStefano Zampini 1566225daaf8SStefano Zampini Input Parameters: 156745b8d346SStefano Zampini + parcsr - the pointer to the hypre_ParCSRMatrix 1568bb4689ddSStefano Zampini . mtype - matrix type to be created. Currently MATAIJ, MATIS and MATHYPRE are supported. 1569225daaf8SStefano Zampini - copymode - PETSc copying options 1570225daaf8SStefano Zampini 1571225daaf8SStefano Zampini Output Parameter: 1572225daaf8SStefano Zampini . A - the matrix 1573225daaf8SStefano Zampini 1574225daaf8SStefano Zampini Level: intermediate 1575225daaf8SStefano Zampini 1576db781477SPatrick Sanan .seealso: `MatHYPRE`, `PetscCopyMode` 1577225daaf8SStefano Zampini */ 157845b8d346SStefano Zampini PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat* A) 1579978814f1SStefano Zampini { 1580225daaf8SStefano Zampini Mat T; 1581978814f1SStefano Zampini Mat_HYPRE *hA; 1582978814f1SStefano Zampini MPI_Comm comm; 1583978814f1SStefano Zampini PetscInt rstart,rend,cstart,cend,M,N; 1584d248a85cSRichard Tran Mills PetscBool isseqaij,isseqaijmkl,ismpiaij,isaij,ishyp,isis; 1585978814f1SStefano Zampini 1586978814f1SStefano Zampini PetscFunctionBegin; 1587978814f1SStefano Zampini comm = hypre_ParCSRMatrixComm(parcsr); 15889566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype,MATSEQAIJ,&isseqaij)); 15899566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype,MATSEQAIJMKL,&isseqaijmkl)); 15909566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype,MATMPIAIJ,&ismpiaij)); 15919566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype,MATAIJ,&isaij)); 15929566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype,MATHYPRE,&ishyp)); 15939566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype,MATIS,&isis)); 1594d248a85cSRichard Tran Mills isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij); 15956ea7df73SStefano Zampini /* TODO */ 1596aed4548fSBarry Smith PetscCheck(isaij || ishyp || isis,comm,PETSC_ERR_SUP,"Unsupported MatType %s! Supported types are %s, %s, %s, %s, %s, and %s",mtype,MATAIJ,MATSEQAIJ,MATSEQAIJMKL,MATMPIAIJ,MATIS,MATHYPRE); 1597978814f1SStefano Zampini /* access ParCSRMatrix */ 1598978814f1SStefano Zampini rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr); 1599978814f1SStefano Zampini rend = hypre_ParCSRMatrixLastRowIndex(parcsr); 1600978814f1SStefano Zampini cstart = hypre_ParCSRMatrixFirstColDiag(parcsr); 1601978814f1SStefano Zampini cend = hypre_ParCSRMatrixLastColDiag(parcsr); 1602978814f1SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(parcsr); 1603978814f1SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(parcsr); 1604978814f1SStefano Zampini 1605fa92c42cSstefano_zampini /* fix for empty local rows/columns */ 1606fa92c42cSstefano_zampini if (rend < rstart) rend = rstart; 1607fa92c42cSstefano_zampini if (cend < cstart) cend = cstart; 1608fa92c42cSstefano_zampini 1609e6471dc9SStefano Zampini /* PETSc convention */ 1610e6471dc9SStefano Zampini rend++; 1611e6471dc9SStefano Zampini cend++; 1612e6471dc9SStefano Zampini rend = PetscMin(rend,M); 1613e6471dc9SStefano Zampini cend = PetscMin(cend,N); 1614e6471dc9SStefano Zampini 1615978814f1SStefano Zampini /* create PETSc matrix with MatHYPRE */ 16169566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,&T)); 16179566063dSJacob Faibussowitsch PetscCall(MatSetSizes(T,rend-rstart,cend-cstart,M,N)); 16189566063dSJacob Faibussowitsch PetscCall(MatSetType(T,MATHYPRE)); 1619225daaf8SStefano Zampini hA = (Mat_HYPRE*)(T->data); 1620978814f1SStefano Zampini 1621978814f1SStefano Zampini /* create HYPRE_IJMatrix */ 1622792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixCreate,hA->comm,rstart,rend-1,cstart,cend-1,&hA->ij); 1623792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR); 162445b8d346SStefano Zampini 16256ea7df73SStefano Zampini // TODO DEV 162645b8d346SStefano Zampini /* create new ParCSR object if needed */ 162745b8d346SStefano Zampini if (ishyp && copymode == PETSC_COPY_VALUES) { 162845b8d346SStefano Zampini hypre_ParCSRMatrix *new_parcsr; 16296ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0) 163045b8d346SStefano Zampini hypre_CSRMatrix *hdiag,*hoffd,*ndiag,*noffd; 163145b8d346SStefano Zampini 16320e6427aaSSatish Balay new_parcsr = hypre_ParCSRMatrixClone(parcsr,0); 163345b8d346SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 163445b8d346SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 163545b8d346SStefano Zampini ndiag = hypre_ParCSRMatrixDiag(new_parcsr); 163645b8d346SStefano Zampini noffd = hypre_ParCSRMatrixOffd(new_parcsr); 16379566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(ndiag),hypre_CSRMatrixData(hdiag),hypre_CSRMatrixNumNonzeros(hdiag))); 16389566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(noffd),hypre_CSRMatrixData(hoffd),hypre_CSRMatrixNumNonzeros(hoffd))); 16396ea7df73SStefano Zampini #else 16406ea7df73SStefano Zampini new_parcsr = hypre_ParCSRMatrixClone(parcsr,1); 16416ea7df73SStefano Zampini #endif 164245b8d346SStefano Zampini parcsr = new_parcsr; 164345b8d346SStefano Zampini copymode = PETSC_OWN_POINTER; 164445b8d346SStefano Zampini } 1645978814f1SStefano Zampini 1646978814f1SStefano Zampini /* set ParCSR object */ 1647978814f1SStefano Zampini hypre_IJMatrixObject(hA->ij) = parcsr; 16484ec6421dSstefano_zampini T->preallocated = PETSC_TRUE; 1649978814f1SStefano Zampini 1650978814f1SStefano Zampini /* set assembled flag */ 1651978814f1SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 1; 16526ea7df73SStefano Zampini #if 0 1653792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixInitialize,hA->ij); 16546ea7df73SStefano Zampini #endif 1655225daaf8SStefano Zampini if (ishyp) { 16566d2a658fSstefano_zampini PetscMPIInt myid = 0; 16576d2a658fSstefano_zampini 16586d2a658fSstefano_zampini /* make sure we always have row_starts and col_starts available */ 16596d2a658fSstefano_zampini if (HYPRE_AssumedPartitionCheck()) { 16609566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm,&myid)); 16616d2a658fSstefano_zampini } 1662a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 16636d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) { 16646d2a658fSstefano_zampini PetscLayout map; 16656d2a658fSstefano_zampini 16669566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T,NULL,&map)); 16679566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 16682cf14000SStefano Zampini hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt*)(map->range + myid); 16696d2a658fSstefano_zampini } 16706d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) { 16716d2a658fSstefano_zampini PetscLayout map; 16726d2a658fSstefano_zampini 16739566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T,&map,NULL)); 16749566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 16752cf14000SStefano Zampini hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt*)(map->range + myid); 16766d2a658fSstefano_zampini } 1677a1d2239cSSatish Balay #endif 1678978814f1SStefano Zampini /* prevent from freeing the pointer */ 1679978814f1SStefano Zampini if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE; 1680225daaf8SStefano Zampini *A = T; 16819566063dSJacob Faibussowitsch PetscCall(MatSetOption(*A,MAT_SORTED_FULL,PETSC_TRUE)); 16829566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*A,MAT_FINAL_ASSEMBLY)); 16839566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*A,MAT_FINAL_ASSEMBLY)); 1684bb4689ddSStefano Zampini } else if (isaij) { 1685bb4689ddSStefano Zampini if (copymode != PETSC_OWN_POINTER) { 1686225daaf8SStefano Zampini /* prevent from freeing the pointer */ 1687225daaf8SStefano Zampini hA->inner_free = PETSC_FALSE; 16889566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T,MATAIJ,MAT_INITIAL_MATRIX,A)); 16899566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T)); 1690225daaf8SStefano Zampini } else { /* AIJ return type with PETSC_OWN_POINTER */ 16919566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T,MATAIJ,MAT_INPLACE_MATRIX,&T)); 1692225daaf8SStefano Zampini *A = T; 1693225daaf8SStefano Zampini } 1694bb4689ddSStefano Zampini } else if (isis) { 16959566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_IS(T,MATIS,MAT_INITIAL_MATRIX,A)); 16968cfe8d00SStefano Zampini if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE; 16979566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T)); 1698bb4689ddSStefano Zampini } 1699978814f1SStefano Zampini PetscFunctionReturn(0); 1700978814f1SStefano Zampini } 1701978814f1SStefano Zampini 170268ec7858SStefano Zampini static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr) 1703dd9c0a25Sstefano_zampini { 1704dd9c0a25Sstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1705dd9c0a25Sstefano_zampini HYPRE_Int type; 1706dd9c0a25Sstefano_zampini 1707dd9c0a25Sstefano_zampini PetscFunctionBegin; 170828b400f6SJacob Faibussowitsch PetscCheck(hA->ij,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"HYPRE_IJMatrix not present"); 1709792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObjectType,hA->ij,&type); 171008401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"HYPRE_IJMatrix is not of type HYPRE_PARCSR"); 1711792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hA->ij,(void**)parcsr); 1712dd9c0a25Sstefano_zampini PetscFunctionReturn(0); 1713dd9c0a25Sstefano_zampini } 1714dd9c0a25Sstefano_zampini 1715dd9c0a25Sstefano_zampini /* 1716dd9c0a25Sstefano_zampini MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix 1717dd9c0a25Sstefano_zampini 1718dd9c0a25Sstefano_zampini Not collective 1719dd9c0a25Sstefano_zampini 1720dd9c0a25Sstefano_zampini Input Parameters: 1721dd9c0a25Sstefano_zampini + A - the MATHYPRE object 1722dd9c0a25Sstefano_zampini 1723dd9c0a25Sstefano_zampini Output Parameter: 1724dd9c0a25Sstefano_zampini . parcsr - the pointer to the hypre_ParCSRMatrix 1725dd9c0a25Sstefano_zampini 1726dd9c0a25Sstefano_zampini Level: intermediate 1727dd9c0a25Sstefano_zampini 1728db781477SPatrick Sanan .seealso: `MatHYPRE`, `PetscCopyMode` 1729dd9c0a25Sstefano_zampini */ 1730dd9c0a25Sstefano_zampini PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr) 1731dd9c0a25Sstefano_zampini { 1732dd9c0a25Sstefano_zampini PetscFunctionBegin; 1733dd9c0a25Sstefano_zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1734dd9c0a25Sstefano_zampini PetscValidType(A,1); 1735cac4c232SBarry Smith PetscUseMethod(A,"MatHYPREGetParCSR_C",(Mat,hypre_ParCSRMatrix**),(A,parcsr)); 1736dd9c0a25Sstefano_zampini PetscFunctionReturn(0); 1737dd9c0a25Sstefano_zampini } 1738dd9c0a25Sstefano_zampini 173968ec7858SStefano Zampini static PetscErrorCode MatMissingDiagonal_HYPRE(Mat A, PetscBool *missing, PetscInt *dd) 174068ec7858SStefano Zampini { 174168ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 174268ec7858SStefano Zampini hypre_CSRMatrix *ha; 174368ec7858SStefano Zampini PetscInt rst; 174468ec7858SStefano Zampini 174568ec7858SStefano Zampini PetscFunctionBegin; 174608401ef6SPierre Jolivet PetscCheck(A->rmap->n == A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented with non-square diagonal blocks"); 17479566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A,&rst,NULL)); 17489566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 174968ec7858SStefano Zampini if (missing) *missing = PETSC_FALSE; 175068ec7858SStefano Zampini if (dd) *dd = -1; 175168ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 175268ec7858SStefano Zampini if (ha) { 175368299464SStefano Zampini PetscInt size,i; 175468299464SStefano Zampini HYPRE_Int *ii,*jj; 175568ec7858SStefano Zampini 175668ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 175768ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 175868ec7858SStefano Zampini jj = hypre_CSRMatrixJ(ha); 175968ec7858SStefano Zampini for (i = 0; i < size; i++) { 176068ec7858SStefano Zampini PetscInt j; 176168ec7858SStefano Zampini PetscBool found = PETSC_FALSE; 176268ec7858SStefano Zampini 176368ec7858SStefano Zampini for (j = ii[i]; j < ii[i+1] && !found; j++) 176468ec7858SStefano Zampini found = (jj[j] == i) ? PETSC_TRUE : PETSC_FALSE; 176568ec7858SStefano Zampini 176668ec7858SStefano Zampini if (!found) { 17677d3de750SJacob Faibussowitsch PetscInfo(A,"Matrix is missing local diagonal entry %" PetscInt_FMT "\n",i); 176868ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 176968ec7858SStefano Zampini if (dd) *dd = i+rst; 177068ec7858SStefano Zampini PetscFunctionReturn(0); 177168ec7858SStefano Zampini } 177268ec7858SStefano Zampini } 177368ec7858SStefano Zampini if (!size) { 177468ec7858SStefano Zampini PetscInfo(A,"Matrix has no diagonal entries therefore is missing diagonal\n"); 177568ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 177668ec7858SStefano Zampini if (dd) *dd = rst; 177768ec7858SStefano Zampini } 177868ec7858SStefano Zampini } else { 177968ec7858SStefano Zampini PetscInfo(A,"Matrix has no diagonal entries therefore is missing diagonal\n"); 178068ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 178168ec7858SStefano Zampini if (dd) *dd = rst; 178268ec7858SStefano Zampini } 178368ec7858SStefano Zampini PetscFunctionReturn(0); 178468ec7858SStefano Zampini } 178568ec7858SStefano Zampini 178668ec7858SStefano Zampini static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s) 178768ec7858SStefano Zampini { 178868ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 17896ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 179068ec7858SStefano Zampini hypre_CSRMatrix *ha; 17916ea7df73SStefano Zampini #endif 179239accc25SStefano Zampini HYPRE_Complex hs; 179368ec7858SStefano Zampini 179468ec7858SStefano Zampini PetscFunctionBegin; 17959566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(s,&hs)); 17969566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 17976ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,19,0) 1798792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixScale,parcsr,hs); 17996ea7df73SStefano Zampini #else /* diagonal part */ 180068ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 180168ec7858SStefano Zampini if (ha) { 180268299464SStefano Zampini PetscInt size,i; 180368299464SStefano Zampini HYPRE_Int *ii; 180439accc25SStefano Zampini HYPRE_Complex *a; 180568ec7858SStefano Zampini 180668ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 180768ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 180868ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 180939accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 181068ec7858SStefano Zampini } 181168ec7858SStefano Zampini /* offdiagonal part */ 181268ec7858SStefano Zampini ha = hypre_ParCSRMatrixOffd(parcsr); 181368ec7858SStefano Zampini if (ha) { 181468299464SStefano Zampini PetscInt size,i; 181568299464SStefano Zampini HYPRE_Int *ii; 181639accc25SStefano Zampini HYPRE_Complex *a; 181768ec7858SStefano Zampini 181868ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 181968ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 182068ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 182139accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 182268ec7858SStefano Zampini } 18236ea7df73SStefano Zampini #endif 182468ec7858SStefano Zampini PetscFunctionReturn(0); 182568ec7858SStefano Zampini } 182668ec7858SStefano Zampini 182768ec7858SStefano Zampini static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 182868ec7858SStefano Zampini { 182968ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 183068299464SStefano Zampini HYPRE_Int *lrows; 183168299464SStefano Zampini PetscInt rst,ren,i; 183268ec7858SStefano Zampini 183368ec7858SStefano Zampini PetscFunctionBegin; 183408401ef6SPierre Jolivet PetscCheck(!x && !b,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"To be implemented"); 18359566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 18369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numRows,&lrows)); 18379566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A,&rst,&ren)); 183868ec7858SStefano Zampini for (i=0;i<numRows;i++) { 183968ec7858SStefano Zampini if (rows[i] < rst || rows[i] >= ren) 184068ec7858SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Non-local rows not yet supported"); 184168ec7858SStefano Zampini lrows[i] = rows[i] - rst; 184268ec7858SStefano Zampini } 1843792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixEliminateRowsCols,parcsr,numRows,lrows); 18449566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows)); 184568ec7858SStefano Zampini PetscFunctionReturn(0); 184668ec7858SStefano Zampini } 184768ec7858SStefano Zampini 1848c69f721fSFande Kong static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha) 1849c69f721fSFande Kong { 1850c69f721fSFande Kong PetscFunctionBegin; 1851c69f721fSFande Kong if (ha) { 1852c69f721fSFande Kong HYPRE_Int *ii, size; 1853c69f721fSFande Kong HYPRE_Complex *a; 1854c69f721fSFande Kong 1855c69f721fSFande Kong size = hypre_CSRMatrixNumRows(ha); 1856c69f721fSFande Kong a = hypre_CSRMatrixData(ha); 1857c69f721fSFande Kong ii = hypre_CSRMatrixI(ha); 1858c69f721fSFande Kong 18599566063dSJacob Faibussowitsch if (a) PetscCall(PetscArrayzero(a,ii[size])); 1860c69f721fSFande Kong } 1861c69f721fSFande Kong PetscFunctionReturn(0); 1862c69f721fSFande Kong } 1863c69f721fSFande Kong 1864c69f721fSFande Kong PetscErrorCode MatZeroEntries_HYPRE(Mat A) 1865c69f721fSFande Kong { 18666ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 18676ea7df73SStefano Zampini 18686ea7df73SStefano Zampini PetscFunctionBegin; 18696ea7df73SStefano Zampini if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) { 1870792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetConstantValues,hA->ij,0.0); 18716ea7df73SStefano Zampini } else { 1872c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 1873c69f721fSFande Kong 18749566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 18759566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr))); 18769566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr))); 18776ea7df73SStefano Zampini } 1878c69f721fSFande Kong PetscFunctionReturn(0); 1879c69f721fSFande Kong } 1880c69f721fSFande Kong 188139accc25SStefano Zampini static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA,PetscInt N,const PetscInt rows[],HYPRE_Complex diag) 1882c69f721fSFande Kong { 188339accc25SStefano Zampini PetscInt ii; 188439accc25SStefano Zampini HYPRE_Int *i, *j; 188539accc25SStefano Zampini HYPRE_Complex *a; 1886c69f721fSFande Kong 1887c69f721fSFande Kong PetscFunctionBegin; 1888c69f721fSFande Kong if (!hA) PetscFunctionReturn(0); 1889c69f721fSFande Kong 189039accc25SStefano Zampini i = hypre_CSRMatrixI(hA); 189139accc25SStefano Zampini j = hypre_CSRMatrixJ(hA); 1892c69f721fSFande Kong a = hypre_CSRMatrixData(hA); 1893c69f721fSFande Kong 1894c69f721fSFande Kong for (ii = 0; ii < N; ii++) { 189539accc25SStefano Zampini HYPRE_Int jj, ibeg, iend, irow; 189639accc25SStefano Zampini 1897c69f721fSFande Kong irow = rows[ii]; 1898c69f721fSFande Kong ibeg = i[irow]; 1899c69f721fSFande Kong iend = i[irow+1]; 1900c69f721fSFande Kong for (jj = ibeg; jj < iend; jj++) 1901c69f721fSFande Kong if (j[jj] == irow) a[jj] = diag; 1902c69f721fSFande Kong else a[jj] = 0.0; 1903c69f721fSFande Kong } 1904c69f721fSFande Kong PetscFunctionReturn(0); 1905c69f721fSFande Kong } 1906c69f721fSFande Kong 1907ddbeb582SStefano Zampini static PetscErrorCode MatZeroRows_HYPRE(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 1908c69f721fSFande Kong { 1909c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 1910c69f721fSFande Kong PetscInt *lrows,len; 191139accc25SStefano Zampini HYPRE_Complex hdiag; 1912c69f721fSFande Kong 1913c69f721fSFande Kong PetscFunctionBegin; 191408401ef6SPierre Jolivet PetscCheck(!x && !b,PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size"); 19159566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(diag,&hdiag)); 1916c69f721fSFande Kong /* retrieve the internal matrix */ 19179566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 1918c69f721fSFande Kong /* get locally owned rows */ 19199566063dSJacob Faibussowitsch PetscCall(MatZeroRowsMapLocal_Private(A,N,rows,&len,&lrows)); 1920c69f721fSFande Kong /* zero diagonal part */ 19219566063dSJacob Faibussowitsch PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr),len,lrows,hdiag)); 1922c69f721fSFande Kong /* zero off-diagonal part */ 19239566063dSJacob Faibussowitsch PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr),len,lrows,0.0)); 1924c69f721fSFande Kong 19259566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows)); 1926c69f721fSFande Kong PetscFunctionReturn(0); 1927c69f721fSFande Kong } 1928c69f721fSFande Kong 1929ddbeb582SStefano Zampini static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat,MatAssemblyType mode) 1930c69f721fSFande Kong { 1931c69f721fSFande Kong PetscFunctionBegin; 1932c69f721fSFande Kong if (mat->nooffprocentries) PetscFunctionReturn(0); 1933c69f721fSFande Kong 19349566063dSJacob Faibussowitsch PetscCall(MatStashScatterBegin_Private(mat,&mat->stash,mat->rmap->range)); 1935c69f721fSFande Kong PetscFunctionReturn(0); 1936c69f721fSFande Kong } 1937c69f721fSFande Kong 1938ddbeb582SStefano Zampini static PetscErrorCode MatGetRow_HYPRE(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 1939c69f721fSFande Kong { 1940c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 19412cf14000SStefano Zampini HYPRE_Int hnz; 1942c69f721fSFande Kong 1943c69f721fSFande Kong PetscFunctionBegin; 1944c69f721fSFande Kong /* retrieve the internal matrix */ 19459566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 1946c69f721fSFande Kong /* call HYPRE API */ 1947792fecdfSBarry Smith PetscCallExternal(HYPRE_ParCSRMatrixGetRow,parcsr,row,&hnz,(HYPRE_BigInt**)idx,(HYPRE_Complex**)v); 19482cf14000SStefano Zampini if (nz) *nz = (PetscInt)hnz; 1949c69f721fSFande Kong PetscFunctionReturn(0); 1950c69f721fSFande Kong } 1951c69f721fSFande Kong 1952ddbeb582SStefano Zampini static PetscErrorCode MatRestoreRow_HYPRE(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 1953c69f721fSFande Kong { 1954c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 19552cf14000SStefano Zampini HYPRE_Int hnz; 1956c69f721fSFande Kong 1957c69f721fSFande Kong PetscFunctionBegin; 1958c69f721fSFande Kong /* retrieve the internal matrix */ 19599566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 1960c69f721fSFande Kong /* call HYPRE API */ 19612cf14000SStefano Zampini hnz = nz ? (HYPRE_Int)(*nz) : 0; 1962792fecdfSBarry Smith PetscCallExternal(HYPRE_ParCSRMatrixRestoreRow,parcsr,row,&hnz,(HYPRE_BigInt**)idx,(HYPRE_Complex**)v); 1963c69f721fSFande Kong PetscFunctionReturn(0); 1964c69f721fSFande Kong } 1965c69f721fSFande Kong 1966ddbeb582SStefano Zampini static PetscErrorCode MatGetValues_HYPRE(Mat A,PetscInt m,const PetscInt idxm[],PetscInt n,const PetscInt idxn[],PetscScalar v[]) 1967c69f721fSFande Kong { 196845b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1969c69f721fSFande Kong PetscInt i; 19701d4906efSStefano Zampini 1971c69f721fSFande Kong PetscFunctionBegin; 1972c69f721fSFande Kong if (!m || !n) PetscFunctionReturn(0); 1973c69f721fSFande Kong /* Ignore negative row indices 1974c69f721fSFande Kong * And negative column indices should be automatically ignored in hypre 1975c69f721fSFande Kong * */ 19762cf14000SStefano Zampini for (i=0; i<m; i++) { 19772cf14000SStefano Zampini if (idxm[i] >= 0) { 19782cf14000SStefano Zampini HYPRE_Int hn = (HYPRE_Int)n; 1979792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetValues,hA->ij,1,&hn,(HYPRE_BigInt*)&idxm[i],(HYPRE_BigInt*)idxn,(HYPRE_Complex*)(v + i*n)); 19802cf14000SStefano Zampini } 19812cf14000SStefano Zampini } 1982c69f721fSFande Kong PetscFunctionReturn(0); 1983c69f721fSFande Kong } 1984c69f721fSFande Kong 1985ddbeb582SStefano Zampini static PetscErrorCode MatSetOption_HYPRE(Mat A,MatOption op,PetscBool flg) 1986ddbeb582SStefano Zampini { 1987ddbeb582SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1988ddbeb582SStefano Zampini 1989ddbeb582SStefano Zampini PetscFunctionBegin; 1990c6698e78SStefano Zampini switch (op) { 1991ddbeb582SStefano Zampini case MAT_NO_OFF_PROC_ENTRIES: 1992ddbeb582SStefano Zampini if (flg) { 1993792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixSetMaxOffProcElmts,hA->ij,0); 1994ddbeb582SStefano Zampini } 1995ddbeb582SStefano Zampini break; 1996336664bdSPierre Jolivet case MAT_SORTED_FULL: 1997336664bdSPierre Jolivet hA->sorted_full = flg; 1998336664bdSPierre Jolivet break; 1999ddbeb582SStefano Zampini default: 2000ddbeb582SStefano Zampini break; 2001ddbeb582SStefano Zampini } 2002ddbeb582SStefano Zampini PetscFunctionReturn(0); 2003ddbeb582SStefano Zampini } 2004c69f721fSFande Kong 200545b8d346SStefano Zampini static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view) 200645b8d346SStefano Zampini { 200745b8d346SStefano Zampini PetscViewerFormat format; 200845b8d346SStefano Zampini 200945b8d346SStefano Zampini PetscFunctionBegin; 20109566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(view,&format)); 20116ea7df73SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 201245b8d346SStefano Zampini if (format != PETSC_VIEWER_NATIVE) { 20136ea7df73SStefano Zampini Mat B; 20146ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 20156ea7df73SStefano Zampini PetscErrorCode (*mview)(Mat,PetscViewer) = NULL; 20166ea7df73SStefano Zampini 20179566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 20189566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(parcsr,MATAIJ,PETSC_USE_POINTER,&B)); 20199566063dSJacob Faibussowitsch PetscCall(MatGetOperation(B,MATOP_VIEW,(void(**)(void))&mview)); 202028b400f6SJacob Faibussowitsch PetscCheck(mview,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing view operation"); 20219566063dSJacob Faibussowitsch PetscCall((*mview)(B,view)); 20229566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 202345b8d346SStefano Zampini } else { 202445b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 202545b8d346SStefano Zampini PetscMPIInt size; 202645b8d346SStefano Zampini PetscBool isascii; 202745b8d346SStefano Zampini const char *filename; 202845b8d346SStefano Zampini 202945b8d346SStefano Zampini /* HYPRE uses only text files */ 20309566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)view,PETSCVIEWERASCII,&isascii)); 203128b400f6SJacob Faibussowitsch PetscCheck(isascii,PetscObjectComm((PetscObject)view),PETSC_ERR_SUP,"PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII",((PetscObject)view)->type_name); 20329566063dSJacob Faibussowitsch PetscCall(PetscViewerFileGetName(view,&filename)); 2033792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixPrint,hA->ij,filename); 20349566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(hA->comm,&size)); 203545b8d346SStefano Zampini if (size > 1) { 20369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view,"Matrix files: %s.%05d ... %s.%05d\n",filename,0,filename,size-1)); 203745b8d346SStefano Zampini } else { 20389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view,"Matrix file: %s.%05d\n",filename,0)); 203945b8d346SStefano Zampini } 204045b8d346SStefano Zampini } 204145b8d346SStefano Zampini PetscFunctionReturn(0); 204245b8d346SStefano Zampini } 204345b8d346SStefano Zampini 204445b8d346SStefano Zampini static PetscErrorCode MatDuplicate_HYPRE(Mat A,MatDuplicateOption op, Mat *B) 204545b8d346SStefano Zampini { 20466abb4441SStefano Zampini hypre_ParCSRMatrix *parcsr = NULL; 204745b8d346SStefano Zampini PetscCopyMode cpmode; 204845b8d346SStefano Zampini 204945b8d346SStefano Zampini PetscFunctionBegin; 20509566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 205145b8d346SStefano Zampini if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) { 20520e6427aaSSatish Balay parcsr = hypre_ParCSRMatrixClone(parcsr,0); 205345b8d346SStefano Zampini cpmode = PETSC_OWN_POINTER; 205445b8d346SStefano Zampini } else { 205545b8d346SStefano Zampini cpmode = PETSC_COPY_VALUES; 205645b8d346SStefano Zampini } 20579566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(parcsr,MATHYPRE,cpmode,B)); 205845b8d346SStefano Zampini PetscFunctionReturn(0); 205945b8d346SStefano Zampini } 206045b8d346SStefano Zampini 2061465edc17SStefano Zampini static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str) 2062465edc17SStefano Zampini { 2063465edc17SStefano Zampini hypre_ParCSRMatrix *acsr,*bcsr; 2064465edc17SStefano Zampini 2065465edc17SStefano Zampini PetscFunctionBegin; 2066465edc17SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 20679566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&acsr)); 20689566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(B,&bcsr)); 2069792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixCopy,acsr,bcsr,1); 20709566063dSJacob Faibussowitsch PetscCall(MatSetOption(B,MAT_SORTED_FULL,PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 20719566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY)); 20729566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY)); 2073465edc17SStefano Zampini } else { 20749566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A,B,str)); 2075465edc17SStefano Zampini } 2076465edc17SStefano Zampini PetscFunctionReturn(0); 2077465edc17SStefano Zampini } 2078465edc17SStefano Zampini 20796305df00SStefano Zampini static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d) 20806305df00SStefano Zampini { 20816305df00SStefano Zampini hypre_ParCSRMatrix *parcsr; 20826305df00SStefano Zampini hypre_CSRMatrix *dmat; 208339accc25SStefano Zampini HYPRE_Complex *a; 208439accc25SStefano Zampini HYPRE_Complex *data = NULL; 20852cf14000SStefano Zampini HYPRE_Int *diag = NULL; 20862cf14000SStefano Zampini PetscInt i; 20876305df00SStefano Zampini PetscBool cong; 20886305df00SStefano Zampini 20896305df00SStefano Zampini PetscFunctionBegin; 20909566063dSJacob Faibussowitsch PetscCall(MatHasCongruentLayouts(A,&cong)); 209128b400f6SJacob Faibussowitsch PetscCheck(cong,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only for square matrices with same local distributions of rows and columns"); 209276bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 20936305df00SStefano Zampini PetscBool miss; 20949566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal(A,&miss,NULL)); 209508401ef6SPierre Jolivet PetscCheck(!miss || !A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented when diagonal entries are missing"); 20966305df00SStefano Zampini } 20979566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 20986305df00SStefano Zampini dmat = hypre_ParCSRMatrixDiag(parcsr); 20996305df00SStefano Zampini if (dmat) { 210039accc25SStefano Zampini /* this cast fixes the clang error: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 21019566063dSJacob Faibussowitsch PetscCall(VecGetArray(d,(PetscScalar**)&a)); 21022cf14000SStefano Zampini diag = hypre_CSRMatrixI(dmat); 210339accc25SStefano Zampini data = hypre_CSRMatrixData(dmat); 21046305df00SStefano Zampini for (i=0;i<A->rmap->n;i++) a[i] = data[diag[i]]; 21059566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(d,(PetscScalar**)&a)); 21066305df00SStefano Zampini } 21076305df00SStefano Zampini PetscFunctionReturn(0); 21086305df00SStefano Zampini } 21096305df00SStefano Zampini 2110363d496dSStefano Zampini #include <petscblaslapack.h> 2111363d496dSStefano Zampini 2112363d496dSStefano Zampini static PetscErrorCode MatAXPY_HYPRE(Mat Y,PetscScalar a,Mat X,MatStructure str) 2113363d496dSStefano Zampini { 2114363d496dSStefano Zampini PetscFunctionBegin; 21156ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 21166ea7df73SStefano Zampini { 21176ea7df73SStefano Zampini Mat B; 21186ea7df73SStefano Zampini hypre_ParCSRMatrix *x,*y,*z; 21196ea7df73SStefano Zampini 21209566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y,&y)); 21219566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X,&x)); 2122792fecdfSBarry Smith PetscCallExternal(hypre_ParCSRMatrixAdd,1.0,y,1.0,x,&z); 21239566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(z,MATHYPRE,PETSC_OWN_POINTER,&B)); 21249566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y,&B)); 21256ea7df73SStefano Zampini } 21266ea7df73SStefano Zampini #else 2127363d496dSStefano Zampini if (str == SAME_NONZERO_PATTERN) { 2128363d496dSStefano Zampini hypre_ParCSRMatrix *x,*y; 2129363d496dSStefano Zampini hypre_CSRMatrix *xloc,*yloc; 2130363d496dSStefano Zampini PetscInt xnnz,ynnz; 213139accc25SStefano Zampini HYPRE_Complex *xarr,*yarr; 2132363d496dSStefano Zampini PetscBLASInt one=1,bnz; 2133363d496dSStefano Zampini 21349566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y,&y)); 21359566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X,&x)); 2136363d496dSStefano Zampini 2137363d496dSStefano Zampini /* diagonal block */ 2138363d496dSStefano Zampini xloc = hypre_ParCSRMatrixDiag(x); 2139363d496dSStefano Zampini yloc = hypre_ParCSRMatrixDiag(y); 2140363d496dSStefano Zampini xnnz = 0; 2141363d496dSStefano Zampini ynnz = 0; 2142363d496dSStefano Zampini xarr = NULL; 2143363d496dSStefano Zampini yarr = NULL; 2144363d496dSStefano Zampini if (xloc) { 214539accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2146363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2147363d496dSStefano Zampini } 2148363d496dSStefano Zampini if (yloc) { 214939accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2150363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2151363d496dSStefano Zampini } 215208401ef6SPierre Jolivet PetscCheck(xnnz == ynnz,PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT,xnnz,ynnz); 21539566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz,&bnz)); 2154792fecdfSBarry Smith PetscCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&a,(PetscScalar*)xarr,&one,(PetscScalar*)yarr,&one)); 2155363d496dSStefano Zampini 2156363d496dSStefano Zampini /* off-diagonal block */ 2157363d496dSStefano Zampini xloc = hypre_ParCSRMatrixOffd(x); 2158363d496dSStefano Zampini yloc = hypre_ParCSRMatrixOffd(y); 2159363d496dSStefano Zampini xnnz = 0; 2160363d496dSStefano Zampini ynnz = 0; 2161363d496dSStefano Zampini xarr = NULL; 2162363d496dSStefano Zampini yarr = NULL; 2163363d496dSStefano Zampini if (xloc) { 216439accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2165363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2166363d496dSStefano Zampini } 2167363d496dSStefano Zampini if (yloc) { 216839accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2169363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2170363d496dSStefano Zampini } 217108401ef6SPierre Jolivet PetscCheck(xnnz == ynnz,PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT,xnnz,ynnz); 21729566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz,&bnz)); 2173792fecdfSBarry Smith PetscCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&a,(PetscScalar*)xarr,&one,(PetscScalar*)yarr,&one)); 2174363d496dSStefano Zampini } else if (str == SUBSET_NONZERO_PATTERN) { 21759566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y,a,X,str)); 2176363d496dSStefano Zampini } else { 2177363d496dSStefano Zampini Mat B; 2178363d496dSStefano Zampini 21799566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic_Preallocate(Y,X,&B)); 21809566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B,Y,a,X,str)); 21819566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(Y,&B)); 2182363d496dSStefano Zampini } 21836ea7df73SStefano Zampini #endif 2184363d496dSStefano Zampini PetscFunctionReturn(0); 2185363d496dSStefano Zampini } 2186363d496dSStefano Zampini 2187e8729f6fSJunchao Zhang static PetscErrorCode MatSetPreallocationCOO_HYPRE(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 21885fbaff96SJunchao Zhang { 21895fbaff96SJunchao Zhang MPI_Comm comm; 21905fbaff96SJunchao Zhang PetscMPIInt size; 21915fbaff96SJunchao Zhang PetscLayout rmap,cmap; 21925fbaff96SJunchao Zhang Mat_HYPRE *hmat; 21935fbaff96SJunchao Zhang hypre_ParCSRMatrix *parCSR; 21945fbaff96SJunchao Zhang hypre_CSRMatrix *diag,*offd; 21955fbaff96SJunchao Zhang Mat A,B,cooMat; 21965fbaff96SJunchao Zhang PetscScalar *Aa,*Ba; 21975fbaff96SJunchao Zhang HYPRE_MemoryLocation hypreMemtype = HYPRE_MEMORY_HOST; 21985fbaff96SJunchao Zhang PetscMemType petscMemtype; 21995fbaff96SJunchao Zhang MatType matType = MATAIJ; /* default type of cooMat */ 22005fbaff96SJunchao Zhang 22015fbaff96SJunchao Zhang PetscFunctionBegin; 22025fbaff96SJunchao Zhang /* Build an agent matrix cooMat whose type is either MATAIJ or MATAIJKOKKOS. 22035fbaff96SJunchao Zhang It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work. 22045fbaff96SJunchao Zhang */ 22055fbaff96SJunchao Zhang PetscCall(PetscObjectGetComm((PetscObject)mat,&comm)); 22065fbaff96SJunchao Zhang PetscCallMPI(MPI_Comm_size(comm,&size)); 22075fbaff96SJunchao Zhang PetscCall(PetscLayoutSetUp(mat->rmap)); 22085fbaff96SJunchao Zhang PetscCall(PetscLayoutSetUp(mat->cmap)); 22095fbaff96SJunchao Zhang PetscCall(MatGetLayouts(mat,&rmap,&cmap)); 22105fbaff96SJunchao Zhang 22115fbaff96SJunchao Zhang /* I do not know how hypre_ParCSRMatrix stores diagonal elements for non-square matrices, so I just give up now */ 22125fbaff96SJunchao Zhang PetscCheck(rmap->N == cmap->N,comm,PETSC_ERR_SUP,"MATHYPRE COO cannot handle non-square matrices"); 22135fbaff96SJunchao Zhang 22145fbaff96SJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 22155fbaff96SJunchao Zhang if (!mat->boundtocpu) { /* mat will be on device, so will cooMat */ 22165fbaff96SJunchao Zhang #if defined(PETSC_HAVE_KOKKOS) 22175fbaff96SJunchao Zhang matType = MATAIJKOKKOS; 22185fbaff96SJunchao Zhang #else 22195fbaff96SJunchao Zhang SETERRQ(comm,PETSC_ERR_SUP,"To support MATHYPRE COO assembly on device, we need Kokkos, e.g., --download-kokkos --download-kokkos-kernels"); 22205fbaff96SJunchao Zhang #endif 22215fbaff96SJunchao Zhang } 22225fbaff96SJunchao Zhang #endif 22235fbaff96SJunchao Zhang 22245fbaff96SJunchao Zhang /* Do COO preallocation through cooMat */ 22255fbaff96SJunchao Zhang hmat = (Mat_HYPRE*)mat->data; 22265fbaff96SJunchao Zhang PetscCall(MatDestroy(&hmat->cooMat)); 22275fbaff96SJunchao Zhang PetscCall(MatCreate(comm,&cooMat)); 22285fbaff96SJunchao Zhang PetscCall(MatSetType(cooMat,matType)); 22295fbaff96SJunchao Zhang PetscCall(MatSetLayouts(cooMat,rmap,cmap)); 22305fbaff96SJunchao Zhang PetscCall(MatSetPreallocationCOO(cooMat,coo_n,coo_i,coo_j)); 22315fbaff96SJunchao Zhang 22325fbaff96SJunchao Zhang /* Copy the sparsity pattern from cooMat to hypre IJMatrix hmat->ij */ 22335fbaff96SJunchao Zhang PetscCall(MatSetOption(mat,MAT_SORTED_FULL,PETSC_TRUE)); 22345fbaff96SJunchao Zhang PetscCall(MatSetOption(mat,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE)); 22355fbaff96SJunchao Zhang PetscCall(MatHYPRE_CreateFromMat(cooMat,hmat)); /* Create hmat->ij and preallocate it */ 22365fbaff96SJunchao Zhang PetscCall(MatHYPRE_IJMatrixCopy(cooMat,hmat->ij)); /* Copy A's (a,i,j) to hmat->ij. To reuse code. Copying 'a' is not really needed */ 22375fbaff96SJunchao Zhang 22385fbaff96SJunchao Zhang mat->preallocated = PETSC_TRUE; 22395fbaff96SJunchao Zhang PetscCall(MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY)); 22405fbaff96SJunchao Zhang PetscCall(MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY)); /* Migrate mat to device if it is bound to. Hypre builds its own SpMV context here */ 22415fbaff96SJunchao Zhang 22425fbaff96SJunchao Zhang /* Alias cooMat's data array to IJMatrix's */ 2243792fecdfSBarry Smith PetscCallExternal(HYPRE_IJMatrixGetObject,hmat->ij,(void**)&parCSR); 22445fbaff96SJunchao Zhang diag = hypre_ParCSRMatrixDiag(parCSR); 22455fbaff96SJunchao Zhang offd = hypre_ParCSRMatrixOffd(parCSR); 22465fbaff96SJunchao Zhang 22475fbaff96SJunchao Zhang hypreMemtype = hypre_CSRMatrixMemoryLocation(diag); 22485fbaff96SJunchao Zhang A = (size == 1)? cooMat : ((Mat_MPIAIJ*)cooMat->data)->A; 22495fbaff96SJunchao Zhang PetscCall(MatSeqAIJGetCSRAndMemType(A,NULL,NULL,&Aa,&petscMemtype)); 22505fbaff96SJunchao Zhang PetscAssert((PetscMemTypeHost(petscMemtype) && hypreMemtype == HYPRE_MEMORY_HOST) || 22515fbaff96SJunchao Zhang (PetscMemTypeDevice(petscMemtype) && hypreMemtype == HYPRE_MEMORY_DEVICE), 22525fbaff96SJunchao Zhang comm,PETSC_ERR_PLIB,"PETSc and hypre's memory types mismatch"); 22535fbaff96SJunchao Zhang 22545fbaff96SJunchao Zhang hmat->diagJ = hypre_CSRMatrixJ(diag); 2255*e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree",hypre_TFree(hypre_CSRMatrixData(diag),hypreMemtype)); 22565fbaff96SJunchao Zhang hypre_CSRMatrixData(diag) = (HYPRE_Complex*)Aa; 22575fbaff96SJunchao Zhang hypre_CSRMatrixOwnsData(diag) = 0; /* Take ownership of (j,a) away from hypre. As a result, we need to free them on our own */ 22585fbaff96SJunchao Zhang 22595fbaff96SJunchao Zhang /* Copy diagonal pointers of A to device to facilitate MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos */ 22605fbaff96SJunchao Zhang if (hypreMemtype == HYPRE_MEMORY_DEVICE) { 2261*e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TAlloc",hmat->diag = hypre_TAlloc(PetscInt,rmap->n,hypreMemtype)); 22625fbaff96SJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); /* We need updated diagonal positions */ 2263*e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TMemcpy",hypre_TMemcpy(hmat->diag,((Mat_SeqAIJ*)A->data)->diag,PetscInt,rmap->n,hypreMemtype,HYPRE_MEMORY_HOST)); 22645fbaff96SJunchao Zhang } 22655fbaff96SJunchao Zhang 22665fbaff96SJunchao Zhang if (size > 1) { 22675fbaff96SJunchao Zhang B = ((Mat_MPIAIJ*)cooMat->data)->B; 22685fbaff96SJunchao Zhang PetscCall(MatSeqAIJGetCSRAndMemType(B,NULL,NULL,&Ba,&petscMemtype)); 22695fbaff96SJunchao Zhang hmat->offdJ = hypre_CSRMatrixJ(offd); 2270*e77caa6dSBarry Smith PetscStackCallExternalVoid("hypre_TFree",hypre_TFree(hypre_CSRMatrixData(offd),hypreMemtype)); 22715fbaff96SJunchao Zhang hypre_CSRMatrixData(offd) = (HYPRE_Complex*)Ba; 22725fbaff96SJunchao Zhang hypre_CSRMatrixOwnsData(offd) = 0; 22735fbaff96SJunchao Zhang } 22745fbaff96SJunchao Zhang 22755fbaff96SJunchao Zhang /* Record cooMat for use in MatSetValuesCOO_HYPRE */ 22765fbaff96SJunchao Zhang hmat->cooMat = cooMat; 22775fbaff96SJunchao Zhang hmat->memType = hypreMemtype; 22785fbaff96SJunchao Zhang PetscFunctionReturn(0); 22795fbaff96SJunchao Zhang } 22805fbaff96SJunchao Zhang 22815fbaff96SJunchao Zhang static PetscErrorCode MatSetValuesCOO_HYPRE(Mat mat, const PetscScalar v[], InsertMode imode) 22825fbaff96SJunchao Zhang { 22835fbaff96SJunchao Zhang Mat_HYPRE *hmat = (Mat_HYPRE*)mat->data; 22845fbaff96SJunchao Zhang PetscMPIInt size; 22855fbaff96SJunchao Zhang Mat A; 22865fbaff96SJunchao Zhang 22875fbaff96SJunchao Zhang PetscFunctionBegin; 22885fbaff96SJunchao Zhang PetscCheck(hmat->cooMat,hmat->comm,PETSC_ERR_PLIB,"HYPRE COO delegate matrix has not been created yet"); 22895fbaff96SJunchao Zhang PetscCallMPI(MPI_Comm_size(hmat->comm,&size)); 22905fbaff96SJunchao Zhang PetscCall(MatSetValuesCOO(hmat->cooMat,v,imode)); 22915fbaff96SJunchao Zhang 22925fbaff96SJunchao Zhang /* Move diagonal elements of the diagonal block to the front of their row, as needed by ParCSRMatrix. So damn hacky */ 22935fbaff96SJunchao Zhang A = (size == 1) ? hmat->cooMat : ((Mat_MPIAIJ*)hmat->cooMat->data)->A; 22945fbaff96SJunchao Zhang if (hmat->memType == HYPRE_MEMORY_HOST) { 22955fbaff96SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 22965fbaff96SJunchao Zhang PetscInt i,m,*Ai = aij->i,*Adiag = aij->diag; 22975fbaff96SJunchao Zhang PetscScalar *Aa = aij->a,tmp; 22985fbaff96SJunchao Zhang 22995fbaff96SJunchao Zhang PetscCall(MatGetSize(A,&m,NULL)); 23005fbaff96SJunchao Zhang for (i=0; i<m; i++) { 23015fbaff96SJunchao Zhang if (Adiag[i] >= Ai[i] && Adiag[i] < Ai[i+1]) { /* Digonal element of this row exists in a[] and j[] */ 23025fbaff96SJunchao Zhang tmp = Aa[Ai[i]]; 23035fbaff96SJunchao Zhang Aa[Ai[i]] = Aa[Adiag[i]]; 23045fbaff96SJunchao Zhang Aa[Adiag[i]] = tmp; 23055fbaff96SJunchao Zhang } 23065fbaff96SJunchao Zhang } 23075fbaff96SJunchao Zhang } else { 23085fbaff96SJunchao Zhang #if defined(PETSC_HAVE_KOKKOS_KERNELS) 23095fbaff96SJunchao Zhang PetscCall(MatSeqAIJMoveDiagonalValuesFront_SeqAIJKokkos(A,hmat->diag)); 23105fbaff96SJunchao Zhang #endif 23115fbaff96SJunchao Zhang } 23125fbaff96SJunchao Zhang PetscFunctionReturn(0); 23135fbaff96SJunchao Zhang } 23145fbaff96SJunchao Zhang 2315a055b5aaSBarry Smith /*MC 2316a055b5aaSBarry Smith MATHYPRE - MATHYPRE = "hypre" - A matrix type to be used for sequential and parallel sparse matrices 2317a055b5aaSBarry Smith based on the hypre IJ interface. 2318a055b5aaSBarry Smith 2319a055b5aaSBarry Smith Level: intermediate 2320a055b5aaSBarry Smith 2321db781477SPatrick Sanan .seealso: `MatCreate()` 2322a055b5aaSBarry Smith M*/ 2323a055b5aaSBarry Smith 232463c07aadSStefano Zampini PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B) 232563c07aadSStefano Zampini { 232663c07aadSStefano Zampini Mat_HYPRE *hB; 232763c07aadSStefano Zampini 232863c07aadSStefano Zampini PetscFunctionBegin; 23299566063dSJacob Faibussowitsch PetscCall(PetscNewLog(B,&hB)); 23306ea7df73SStefano Zampini 2331978814f1SStefano Zampini hB->inner_free = PETSC_TRUE; 2332c69f721fSFande Kong hB->available = PETSC_TRUE; 2333336664bdSPierre Jolivet hB->sorted_full = PETSC_FALSE; /* no assumption whether column indices are sorted or not */ 2334c69f721fSFande Kong hB->size = 0; 2335c69f721fSFande Kong hB->array = NULL; 2336978814f1SStefano Zampini 233763c07aadSStefano Zampini B->data = (void*)hB; 233863c07aadSStefano Zampini B->assembled = PETSC_FALSE; 233963c07aadSStefano Zampini 23409566063dSJacob Faibussowitsch PetscCall(PetscMemzero(B->ops,sizeof(struct _MatOps))); 234163c07aadSStefano Zampini B->ops->mult = MatMult_HYPRE; 234263c07aadSStefano Zampini B->ops->multtranspose = MatMultTranspose_HYPRE; 2343414bd5c3SStefano Zampini B->ops->multadd = MatMultAdd_HYPRE; 2344414bd5c3SStefano Zampini B->ops->multtransposeadd = MatMultTransposeAdd_HYPRE; 234563c07aadSStefano Zampini B->ops->setup = MatSetUp_HYPRE; 234663c07aadSStefano Zampini B->ops->destroy = MatDestroy_HYPRE; 234763c07aadSStefano Zampini B->ops->assemblyend = MatAssemblyEnd_HYPRE; 2348c69f721fSFande Kong B->ops->assemblybegin = MatAssemblyBegin_HYPRE; 2349d975228cSstefano_zampini B->ops->setvalues = MatSetValues_HYPRE; 235068ec7858SStefano Zampini B->ops->missingdiagonal = MatMissingDiagonal_HYPRE; 235168ec7858SStefano Zampini B->ops->scale = MatScale_HYPRE; 235268ec7858SStefano Zampini B->ops->zerorowscolumns = MatZeroRowsColumns_HYPRE; 2353c69f721fSFande Kong B->ops->zeroentries = MatZeroEntries_HYPRE; 2354c69f721fSFande Kong B->ops->zerorows = MatZeroRows_HYPRE; 2355c69f721fSFande Kong B->ops->getrow = MatGetRow_HYPRE; 2356c69f721fSFande Kong B->ops->restorerow = MatRestoreRow_HYPRE; 2357c69f721fSFande Kong B->ops->getvalues = MatGetValues_HYPRE; 2358ddbeb582SStefano Zampini B->ops->setoption = MatSetOption_HYPRE; 235945b8d346SStefano Zampini B->ops->duplicate = MatDuplicate_HYPRE; 2360465edc17SStefano Zampini B->ops->copy = MatCopy_HYPRE; 236145b8d346SStefano Zampini B->ops->view = MatView_HYPRE; 23626305df00SStefano Zampini B->ops->getdiagonal = MatGetDiagonal_HYPRE; 2363363d496dSStefano Zampini B->ops->axpy = MatAXPY_HYPRE; 23644222ddf1SHong Zhang B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE; 23656ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 23666ea7df73SStefano Zampini B->ops->bindtocpu = MatBindToCPU_HYPRE; 23676ea7df73SStefano Zampini B->boundtocpu = PETSC_FALSE; 23686ea7df73SStefano Zampini #endif 236945b8d346SStefano Zampini 237045b8d346SStefano Zampini /* build cache for off array entries formed */ 23719566063dSJacob Faibussowitsch PetscCall(MatStashCreate_Private(PetscObjectComm((PetscObject)B),1,&B->stash)); 237263c07aadSStefano Zampini 23739566063dSJacob Faibussowitsch PetscCall(PetscCommGetComm(PetscObjectComm((PetscObject)B),&hB->comm)); 23749566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATHYPRE)); 23759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_hypre_aij_C",MatConvert_HYPRE_AIJ)); 23769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_hypre_is_C",MatConvert_HYPRE_IS)); 23779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_hypre_C",MatProductSetFromOptions_HYPRE)); 23789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_mpiaij_hypre_C",MatProductSetFromOptions_HYPRE)); 23799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatHYPRESetPreallocation_C",MatHYPRESetPreallocation_HYPRE)); 23809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatHYPREGetParCSR_C",MatHYPREGetParCSR_HYPRE)); 23815fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetPreallocationCOO_C",MatSetPreallocationCOO_HYPRE)); 23825fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetValuesCOO_C",MatSetValuesCOO_HYPRE)); 23836ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 23846ea7df73SStefano Zampini #if defined(HYPRE_USING_HIP) 23859566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_HIP)); 23869566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B,VECHIP)); 23876ea7df73SStefano Zampini #endif 23886ea7df73SStefano Zampini #if defined(HYPRE_USING_CUDA) 23899566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_CUDA)); 23909566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B,VECCUDA)); 23916ea7df73SStefano Zampini #endif 23926ea7df73SStefano Zampini #endif 239363c07aadSStefano Zampini PetscFunctionReturn(0); 239463c07aadSStefano Zampini } 239563c07aadSStefano Zampini 2396225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void *ptr) 2397225daaf8SStefano Zampini { 2398225daaf8SStefano Zampini PetscFunctionBegin; 2399e6de0934SSatish Balay hypre_TFree(ptr,HYPRE_MEMORY_HOST); 2400225daaf8SStefano Zampini PetscFunctionReturn(0); 2401225daaf8SStefano Zampini } 2402