163c07aadSStefano Zampini 263c07aadSStefano Zampini /* 363c07aadSStefano Zampini Creates hypre ijmatrix from PETSc matrix 463c07aadSStefano Zampini */ 5225daaf8SStefano Zampini 6c6698e78SStefano Zampini #include <petscpkg_version.h> 739accc25SStefano Zampini #include <petsc/private/petschypre.h> 8dd9c0a25Sstefano_zampini #include <petscmathypre.h> 963c07aadSStefano Zampini #include <petsc/private/matimpl.h> 10a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h> 1163c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h> 1263c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h> 1358968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h> 1458968eb6SStefano Zampini #include <HYPRE.h> 15c1a070e6SStefano Zampini #include <HYPRE_utilities.h> 16cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h> 1768ec7858SStefano Zampini #include <_hypre_sstruct_ls.h> 1863c07aadSStefano Zampini 190e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0) 200e6427aaSSatish Balay #define hypre_ParCSRMatrixClone(A,B) hypre_ParCSRMatrixCompleteClone(A) 210e6427aaSSatish Balay #endif 220e6427aaSSatish Balay 2363c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat,Mat_HYPRE*); 2463c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat,Mat,HYPRE_IJMatrix); 2563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat,HYPRE_IJMatrix); 2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat,HYPRE_IJMatrix); 2739accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat,HYPRE_Complex,Vec,HYPRE_Complex,Vec,PetscBool); 28225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void*); 296ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat,PetscInt,const PetscInt[],PetscInt,const PetscInt[],const PetscScalar[],InsertMode ins); 3063c07aadSStefano Zampini 3163c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij) 3263c07aadSStefano Zampini { 3363c07aadSStefano Zampini PetscInt i,n_d,n_o; 3463c07aadSStefano Zampini const PetscInt *ia_d,*ia_o; 3563c07aadSStefano Zampini PetscBool done_d=PETSC_FALSE,done_o=PETSC_FALSE; 362cf14000SStefano Zampini HYPRE_Int *nnz_d=NULL,*nnz_o=NULL; 3763c07aadSStefano Zampini 3863c07aadSStefano Zampini PetscFunctionBegin; 3963c07aadSStefano Zampini if (A_d) { /* determine number of nonzero entries in local diagonal part */ 405f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetRowIJ(A_d,0,PETSC_FALSE,PETSC_FALSE,&n_d,&ia_d,NULL,&done_d)); 4163c07aadSStefano Zampini if (done_d) { 425f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(n_d,&nnz_d)); 4363c07aadSStefano Zampini for (i=0; i<n_d; i++) { 4463c07aadSStefano Zampini nnz_d[i] = ia_d[i+1] - ia_d[i]; 4563c07aadSStefano Zampini } 4663c07aadSStefano Zampini } 475f80ce2aSJacob Faibussowitsch CHKERRQ(MatRestoreRowIJ(A_d,0,PETSC_FALSE,PETSC_FALSE,NULL,&ia_d,NULL,&done_d)); 4863c07aadSStefano Zampini } 4963c07aadSStefano Zampini if (A_o) { /* determine number of nonzero entries in local off-diagonal part */ 505f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetRowIJ(A_o,0,PETSC_FALSE,PETSC_FALSE,&n_o,&ia_o,NULL,&done_o)); 5163c07aadSStefano Zampini if (done_o) { 525f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(n_o,&nnz_o)); 5363c07aadSStefano Zampini for (i=0; i<n_o; i++) { 5463c07aadSStefano Zampini nnz_o[i] = ia_o[i+1] - ia_o[i]; 5563c07aadSStefano Zampini } 5663c07aadSStefano Zampini } 575f80ce2aSJacob Faibussowitsch CHKERRQ(MatRestoreRowIJ(A_o,0,PETSC_FALSE,PETSC_FALSE,&n_o,&ia_o,NULL,&done_o)); 5863c07aadSStefano Zampini } 5963c07aadSStefano Zampini if (done_d) { /* set number of nonzeros in HYPRE IJ matrix */ 6063c07aadSStefano Zampini if (!done_o) { /* only diagonal part */ 615f80ce2aSJacob Faibussowitsch CHKERRQ(PetscCalloc1(n_d,&nnz_o)); 6263c07aadSStefano Zampini } 63c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0) 64c6698e78SStefano Zampini { /* If we don't do this, the columns of the matrix will be all zeros! */ 65c6698e78SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 66c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij); 67c6698e78SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 68c6698e78SStefano Zampini hypre_IJMatrixTranslator(ij) = NULL; 69a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetDiagOffdSizes,ij,nnz_d,nnz_o); 7022235d61SPierre Jolivet /* it seems they partially fixed it in 2.19.0 */ 7122235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 72c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij); 73c6698e78SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; 7422235d61SPierre Jolivet #endif 75c6698e78SStefano Zampini } 76c6698e78SStefano Zampini #else 77a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetDiagOffdSizes,ij,nnz_d,nnz_o); 78c6698e78SStefano Zampini #endif 795f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(nnz_d)); 805f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(nnz_o)); 8163c07aadSStefano Zampini } 8263c07aadSStefano Zampini PetscFunctionReturn(0); 8363c07aadSStefano Zampini } 8463c07aadSStefano Zampini 8563c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA) 8663c07aadSStefano Zampini { 8763c07aadSStefano Zampini PetscInt rstart,rend,cstart,cend; 8863c07aadSStefano Zampini 8963c07aadSStefano Zampini PetscFunctionBegin; 905f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLayoutSetUp(A->rmap)); 915f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLayoutSetUp(A->cmap)); 9263c07aadSStefano Zampini rstart = A->rmap->rstart; 9363c07aadSStefano Zampini rend = A->rmap->rend; 9463c07aadSStefano Zampini cstart = A->cmap->rstart; 9563c07aadSStefano Zampini cend = A->cmap->rend; 96a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixCreate,hA->comm,rstart,rend-1,cstart,cend-1,&hA->ij); 97a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR); 9863c07aadSStefano Zampini { 9963c07aadSStefano Zampini PetscBool same; 10063c07aadSStefano Zampini Mat A_d,A_o; 10163c07aadSStefano Zampini const PetscInt *colmap; 1025f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&same)); 10363c07aadSStefano Zampini if (same) { 1045f80ce2aSJacob Faibussowitsch CHKERRQ(MatMPIAIJGetSeqAIJ(A,&A_d,&A_o,&colmap)); 1055f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_IJMatrixPreallocate(A_d,A_o,hA->ij)); 10663c07aadSStefano Zampini PetscFunctionReturn(0); 10763c07aadSStefano Zampini } 1085f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIBAIJ,&same)); 10963c07aadSStefano Zampini if (same) { 1105f80ce2aSJacob Faibussowitsch CHKERRQ(MatMPIBAIJGetSeqBAIJ(A,&A_d,&A_o,&colmap)); 1115f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_IJMatrixPreallocate(A_d,A_o,hA->ij)); 11263c07aadSStefano Zampini PetscFunctionReturn(0); 11363c07aadSStefano Zampini } 1145f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&same)); 11563c07aadSStefano Zampini if (same) { 1165f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_IJMatrixPreallocate(A,NULL,hA->ij)); 11763c07aadSStefano Zampini PetscFunctionReturn(0); 11863c07aadSStefano Zampini } 1195f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQBAIJ,&same)); 12063c07aadSStefano Zampini if (same) { 1215f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_IJMatrixPreallocate(A,NULL,hA->ij)); 12263c07aadSStefano Zampini PetscFunctionReturn(0); 12363c07aadSStefano Zampini } 12463c07aadSStefano Zampini } 12563c07aadSStefano Zampini PetscFunctionReturn(0); 12663c07aadSStefano Zampini } 12763c07aadSStefano Zampini 12863c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopy(Mat A, HYPRE_IJMatrix ij) 12963c07aadSStefano Zampini { 13063c07aadSStefano Zampini PetscInt i,rstart,rend,ncols,nr,nc; 13163c07aadSStefano Zampini const PetscScalar *values; 13263c07aadSStefano Zampini const PetscInt *cols; 13363c07aadSStefano Zampini PetscBool flg; 13463c07aadSStefano Zampini 13563c07aadSStefano Zampini PetscFunctionBegin; 1366ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 137a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixInitialize,ij); 1386ea7df73SStefano Zampini #else 139a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixInitialize_v2,ij,HYPRE_MEMORY_HOST); 1406ea7df73SStefano Zampini #endif 1415f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&flg)); 1425f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetSize(A,&nr,&nc)); 14363c07aadSStefano Zampini if (flg && nr == nc) { 1445f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_IJMatrixFastCopy_MPIAIJ(A,ij)); 14563c07aadSStefano Zampini PetscFunctionReturn(0); 14663c07aadSStefano Zampini } 1475f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&flg)); 14863c07aadSStefano Zampini if (flg) { 1495f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_IJMatrixFastCopy_SeqAIJ(A,ij)); 15063c07aadSStefano Zampini PetscFunctionReturn(0); 15163c07aadSStefano Zampini } 15263c07aadSStefano Zampini 1535f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetOwnershipRange(A,&rstart,&rend)); 15463c07aadSStefano Zampini for (i=rstart; i<rend; i++) { 1555f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetRow(A,i,&ncols,&cols,&values)); 156e3977e59Sstefano_zampini if (ncols) { 1572cf14000SStefano Zampini HYPRE_Int nc = (HYPRE_Int)ncols; 1582cf14000SStefano Zampini 1592c71b3e2SJacob Faibussowitsch PetscCheckFalse((PetscInt)nc != ncols,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,ncols,i); 160a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetValues,ij,1,&nc,(HYPRE_BigInt *)&i,(HYPRE_BigInt *)cols,(HYPRE_Complex *)values); 161e3977e59Sstefano_zampini } 1625f80ce2aSJacob Faibussowitsch CHKERRQ(MatRestoreRow(A,i,&ncols,&cols,&values)); 16363c07aadSStefano Zampini } 16463c07aadSStefano Zampini PetscFunctionReturn(0); 16563c07aadSStefano Zampini } 16663c07aadSStefano Zampini 16763c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_SeqAIJ(Mat A, HYPRE_IJMatrix ij) 16863c07aadSStefano Zampini { 16963c07aadSStefano Zampini Mat_SeqAIJ *pdiag = (Mat_SeqAIJ*)A->data; 17058968eb6SStefano Zampini HYPRE_Int type; 17163c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 17263c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 17363c07aadSStefano Zampini hypre_CSRMatrix *hdiag; 1742cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 1756ea7df73SStefano Zampini const PetscScalar *pa; 17663c07aadSStefano Zampini 17763c07aadSStefano Zampini PetscFunctionBegin; 178a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,ij,&type); 1792c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 180a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,ij,(void**)&par_matrix); 18163c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 18263c07aadSStefano Zampini /* 18363c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 18463c07aadSStefano Zampini */ 1852cf14000SStefano Zampini if (sameint) { 1865f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hdiag->i,pdiag->i,A->rmap->n + 1)); 1875f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hdiag->j,pdiag->j,pdiag->nz)); 1882cf14000SStefano Zampini } else { 1892cf14000SStefano Zampini PetscInt i; 1902cf14000SStefano Zampini 1912cf14000SStefano Zampini for (i=0;i<A->rmap->n + 1;i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i]; 1922cf14000SStefano Zampini for (i=0;i<pdiag->nz;i++) hdiag->j[i] = (HYPRE_Int)pdiag->j[i]; 1932cf14000SStefano Zampini } 1946ea7df73SStefano Zampini 1955f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJGetArrayRead(A,&pa)); 1965f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hdiag->data,pa,pdiag->nz)); 1975f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJRestoreArrayRead(A,&pa)); 198ea9daf28SStefano Zampini 199ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij); 20063c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 20163c07aadSStefano Zampini PetscFunctionReturn(0); 20263c07aadSStefano Zampini } 20363c07aadSStefano Zampini 20463c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixFastCopy_MPIAIJ(Mat A, HYPRE_IJMatrix ij) 20563c07aadSStefano Zampini { 20663c07aadSStefano Zampini Mat_MPIAIJ *pA = (Mat_MPIAIJ*)A->data; 20763c07aadSStefano Zampini Mat_SeqAIJ *pdiag,*poffd; 20863c07aadSStefano Zampini PetscInt i,*garray = pA->garray,*jj,cstart,*pjj; 2092cf14000SStefano Zampini HYPRE_Int *hjj,type; 21063c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix; 21163c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 21263c07aadSStefano Zampini hypre_CSRMatrix *hdiag,*hoffd; 2132cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 2146ea7df73SStefano Zampini const PetscScalar *pa; 21563c07aadSStefano Zampini 21663c07aadSStefano Zampini PetscFunctionBegin; 21763c07aadSStefano Zampini pdiag = (Mat_SeqAIJ*) pA->A->data; 21863c07aadSStefano Zampini poffd = (Mat_SeqAIJ*) pA->B->data; 21963c07aadSStefano Zampini /* cstart is only valid for square MPIAIJ layed out in the usual way */ 2205f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetOwnershipRange(A,&cstart,NULL)); 22163c07aadSStefano Zampini 222a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,ij,&type); 2232c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 224a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,ij,(void**)&par_matrix); 22563c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix); 22663c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(par_matrix); 22763c07aadSStefano Zampini 22863c07aadSStefano Zampini /* 22963c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures 23063c07aadSStefano Zampini */ 2312cf14000SStefano Zampini if (sameint) { 2325f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hdiag->i,pdiag->i,pA->A->rmap->n + 1)); 2332cf14000SStefano Zampini } else { 2342cf14000SStefano Zampini for (i=0; i<pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)(pdiag->i[i]); 2352cf14000SStefano Zampini } 23663c07aadSStefano Zampini /* need to shift the diag column indices (hdiag->j) back to global numbering since hypre is expecting this */ 2372cf14000SStefano Zampini hjj = hdiag->j; 2382cf14000SStefano Zampini pjj = pdiag->j; 239c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0) 2402cf14000SStefano Zampini for (i=0; i<pdiag->nz; i++) hjj[i] = pjj[i]; 241c6698e78SStefano Zampini #else 2422cf14000SStefano Zampini for (i=0; i<pdiag->nz; i++) hjj[i] = cstart + pjj[i]; 243c6698e78SStefano Zampini #endif 2445f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJGetArrayRead(pA->A,&pa)); 2455f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hdiag->data,pa,pdiag->nz)); 2465f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJRestoreArrayRead(pA->A,&pa)); 2472cf14000SStefano Zampini if (sameint) { 2485f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hoffd->i,poffd->i,pA->A->rmap->n + 1)); 2492cf14000SStefano Zampini } else { 2502cf14000SStefano Zampini for (i=0; i<pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)(poffd->i[i]); 2512cf14000SStefano Zampini } 2522cf14000SStefano Zampini 25363c07aadSStefano Zampini /* need to move the offd column indices (hoffd->j) back to global numbering since hypre is expecting this 25463c07aadSStefano Zampini If we hacked a hypre a bit more we might be able to avoid this step */ 255c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,16,0) 256a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_CSRMatrixBigInitialize,hoffd); 257c6698e78SStefano Zampini jj = (PetscInt*) hoffd->big_j; 258c6698e78SStefano Zampini #else 25963c07aadSStefano Zampini jj = (PetscInt*) hoffd->j; 260c6698e78SStefano Zampini #endif 2612cf14000SStefano Zampini pjj = poffd->j; 26263c07aadSStefano Zampini for (i=0; i<poffd->nz; i++) jj[i] = garray[pjj[i]]; 263c6698e78SStefano Zampini 2645f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJGetArrayRead(pA->B,&pa)); 2655f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hoffd->data,pa,poffd->nz)); 2665f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJRestoreArrayRead(pA->B,&pa)); 26763c07aadSStefano Zampini 268ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(ij); 26963c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0; 27063c07aadSStefano Zampini PetscFunctionReturn(0); 27163c07aadSStefano Zampini } 27263c07aadSStefano Zampini 2732df22349SStefano Zampini static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat* B) 2742df22349SStefano Zampini { 2752df22349SStefano Zampini Mat_HYPRE* mhA = (Mat_HYPRE*)(A->data); 2762df22349SStefano Zampini Mat lA; 2772df22349SStefano Zampini ISLocalToGlobalMapping rl2g,cl2g; 2782df22349SStefano Zampini IS is; 2792df22349SStefano Zampini hypre_ParCSRMatrix *hA; 2802df22349SStefano Zampini hypre_CSRMatrix *hdiag,*hoffd; 2812df22349SStefano Zampini MPI_Comm comm; 28239accc25SStefano Zampini HYPRE_Complex *hdd,*hod,*aa; 28339accc25SStefano Zampini PetscScalar *data; 2842cf14000SStefano Zampini HYPRE_BigInt *col_map_offd; 2852cf14000SStefano Zampini HYPRE_Int *hdi,*hdj,*hoi,*hoj; 2862df22349SStefano Zampini PetscInt *ii,*jj,*iptr,*jptr; 2872df22349SStefano Zampini PetscInt cum,dr,dc,oc,str,stc,nnz,i,jd,jo,M,N; 28858968eb6SStefano Zampini HYPRE_Int type; 2892df22349SStefano Zampini 2902df22349SStefano Zampini PetscFunctionBegin; 291a1787963SStefano Zampini comm = PetscObjectComm((PetscObject)A); 292a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,mhA->ij,&type); 2932c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 294a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,mhA->ij,(void**)&hA); 2952df22349SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(hA); 2962df22349SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(hA); 2972df22349SStefano Zampini str = hypre_ParCSRMatrixFirstRowIndex(hA); 2982df22349SStefano Zampini stc = hypre_ParCSRMatrixFirstColDiag(hA); 2992df22349SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(hA); 3002df22349SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(hA); 3012df22349SStefano Zampini dr = hypre_CSRMatrixNumRows(hdiag); 3022df22349SStefano Zampini dc = hypre_CSRMatrixNumCols(hdiag); 3032df22349SStefano Zampini nnz = hypre_CSRMatrixNumNonzeros(hdiag); 3042df22349SStefano Zampini hdi = hypre_CSRMatrixI(hdiag); 3052df22349SStefano Zampini hdj = hypre_CSRMatrixJ(hdiag); 3062df22349SStefano Zampini hdd = hypre_CSRMatrixData(hdiag); 3072df22349SStefano Zampini oc = hypre_CSRMatrixNumCols(hoffd); 3082df22349SStefano Zampini nnz += hypre_CSRMatrixNumNonzeros(hoffd); 3092df22349SStefano Zampini hoi = hypre_CSRMatrixI(hoffd); 3102df22349SStefano Zampini hoj = hypre_CSRMatrixJ(hoffd); 3112df22349SStefano Zampini hod = hypre_CSRMatrixData(hoffd); 3122df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 3132df22349SStefano Zampini PetscInt *aux; 3142df22349SStefano Zampini 3152df22349SStefano Zampini /* generate l2g maps for rows and cols */ 3165f80ce2aSJacob Faibussowitsch CHKERRQ(ISCreateStride(comm,dr,str,1,&is)); 3175f80ce2aSJacob Faibussowitsch CHKERRQ(ISLocalToGlobalMappingCreateIS(is,&rl2g)); 3185f80ce2aSJacob Faibussowitsch CHKERRQ(ISDestroy(&is)); 3192df22349SStefano Zampini col_map_offd = hypre_ParCSRMatrixColMapOffd(hA); 3205f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(dc+oc,&aux)); 3212df22349SStefano Zampini for (i=0; i<dc; i++) aux[i] = i+stc; 3222df22349SStefano Zampini for (i=0; i<oc; i++) aux[i+dc] = col_map_offd[i]; 3235f80ce2aSJacob Faibussowitsch CHKERRQ(ISCreateGeneral(comm,dc+oc,aux,PETSC_OWN_POINTER,&is)); 3245f80ce2aSJacob Faibussowitsch CHKERRQ(ISLocalToGlobalMappingCreateIS(is,&cl2g)); 3255f80ce2aSJacob Faibussowitsch CHKERRQ(ISDestroy(&is)); 3262df22349SStefano Zampini /* create MATIS object */ 3275f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreate(comm,B)); 3285f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetSizes(*B,dr,dc,M,N)); 3295f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(*B,MATIS)); 3305f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetLocalToGlobalMapping(*B,rl2g,cl2g)); 3315f80ce2aSJacob Faibussowitsch CHKERRQ(ISLocalToGlobalMappingDestroy(&rl2g)); 3325f80ce2aSJacob Faibussowitsch CHKERRQ(ISLocalToGlobalMappingDestroy(&cl2g)); 3332df22349SStefano Zampini 3342df22349SStefano Zampini /* allocate CSR for local matrix */ 3355f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(dr+1,&iptr)); 3365f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nnz,&jptr)); 3375f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nnz,&data)); 3382df22349SStefano Zampini } else { 3392df22349SStefano Zampini PetscInt nr; 3402df22349SStefano Zampini PetscBool done; 3415f80ce2aSJacob Faibussowitsch CHKERRQ(MatISGetLocalMat(*B,&lA)); 3425f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetRowIJ(lA,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&iptr,(const PetscInt**)&jptr,&done)); 3432c71b3e2SJacob Faibussowitsch PetscCheckFalse(nr != dr,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT,nr,dr); 3442c71b3e2SJacob Faibussowitsch PetscCheckFalse(iptr[nr] < nnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in local mat! reuse %" PetscInt_FMT " requested %" PetscInt_FMT,iptr[nr],nnz); 3455f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJGetArray(lA,&data)); 3462df22349SStefano Zampini } 3472df22349SStefano Zampini /* merge local matrices */ 3482df22349SStefano Zampini ii = iptr; 3492df22349SStefano Zampini jj = jptr; 35039accc25SStefano Zampini aa = (HYPRE_Complex*)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 3512df22349SStefano Zampini *ii = *(hdi++) + *(hoi++); 3522df22349SStefano Zampini for (jd=0,jo=0,cum=0; *ii<nnz; cum++) { 35339accc25SStefano Zampini PetscScalar *aold = (PetscScalar*)aa; 3542df22349SStefano Zampini PetscInt *jold = jj,nc = jd+jo; 3552df22349SStefano Zampini for (; jd<*hdi; jd++) { *jj++ = *hdj++; *aa++ = *hdd++; } 3562df22349SStefano Zampini for (; jo<*hoi; jo++) { *jj++ = *hoj++ + dc; *aa++ = *hod++; } 3572df22349SStefano Zampini *(++ii) = *(hdi++) + *(hoi++); 3585f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSortIntWithScalarArray(jd+jo-nc,jold,aold)); 3592df22349SStefano Zampini } 3602df22349SStefano Zampini for (; cum<dr; cum++) *(++ii) = nnz; 3612df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 362a033916dSStefano Zampini Mat_SeqAIJ* a; 363a033916dSStefano Zampini 3645f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,dr,dc+oc,iptr,jptr,data,&lA)); 3655f80ce2aSJacob Faibussowitsch CHKERRQ(MatISSetLocalMat(*B,lA)); 366a033916dSStefano Zampini /* hack SeqAIJ */ 367a033916dSStefano Zampini a = (Mat_SeqAIJ*)(lA->data); 368a033916dSStefano Zampini a->free_a = PETSC_TRUE; 369a033916dSStefano Zampini a->free_ij = PETSC_TRUE; 3705f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&lA)); 3712df22349SStefano Zampini } 3725f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY)); 3735f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY)); 3742df22349SStefano Zampini if (reuse == MAT_INPLACE_MATRIX) { 3755f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderReplace(A,B)); 3762df22349SStefano Zampini } 3772df22349SStefano Zampini PetscFunctionReturn(0); 3782df22349SStefano Zampini } 3792df22349SStefano Zampini 38063c07aadSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B) 38163c07aadSStefano Zampini { 38284d4e069SStefano Zampini Mat M = NULL; 38363c07aadSStefano Zampini Mat_HYPRE *hB; 38463c07aadSStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 38563c07aadSStefano Zampini 38663c07aadSStefano Zampini PetscFunctionBegin; 38763c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 38863c07aadSStefano Zampini /* always destroy the old matrix and create a new memory; 38963c07aadSStefano Zampini hope this does not churn the memory too much. The problem 39063c07aadSStefano Zampini is I do not know if it is possible to put the matrix back to 39163c07aadSStefano Zampini its initial state so that we can directly copy the values 39263c07aadSStefano Zampini the second time through. */ 39363c07aadSStefano Zampini hB = (Mat_HYPRE*)((*B)->data); 394a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixDestroy,hB->ij); 39563c07aadSStefano Zampini } else { 3965f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreate(comm,&M)); 3975f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(M,MATHYPRE)); 3985f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetSizes(M,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N)); 39984d4e069SStefano Zampini hB = (Mat_HYPRE*)(M->data); 40084d4e069SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) *B = M; 40163c07aadSStefano Zampini } 4025f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetOption(*B,MAT_SORTED_FULL,PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 4035f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetOption(*B,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE)); 4045f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_CreateFromMat(A,hB)); 4055f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_IJMatrixCopy(A,hB->ij)); 40684d4e069SStefano Zampini if (reuse == MAT_INPLACE_MATRIX) { 4075f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderReplace(A,&M)); 40884d4e069SStefano Zampini } 4094ec6421dSstefano_zampini (*B)->preallocated = PETSC_TRUE; 4105f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY)); 4115f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY)); 41263c07aadSStefano Zampini PetscFunctionReturn(0); 41363c07aadSStefano Zampini } 41463c07aadSStefano Zampini 415ea9daf28SStefano Zampini static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B) 41663c07aadSStefano Zampini { 41763c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 41863c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 41963c07aadSStefano Zampini hypre_CSRMatrix *hdiag,*hoffd; 42063c07aadSStefano Zampini MPI_Comm comm; 42163c07aadSStefano Zampini PetscScalar *da,*oa,*aptr; 42263c07aadSStefano Zampini PetscInt *dii,*djj,*oii,*ojj,*iptr; 42363c07aadSStefano Zampini PetscInt i,dnnz,onnz,m,n; 42458968eb6SStefano Zampini HYPRE_Int type; 42563c07aadSStefano Zampini PetscMPIInt size; 4262cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 42763c07aadSStefano Zampini 42863c07aadSStefano Zampini PetscFunctionBegin; 42963c07aadSStefano Zampini comm = PetscObjectComm((PetscObject)A); 430a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hA->ij,&type); 4312c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 43263c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 43363c07aadSStefano Zampini PetscBool ismpiaij,isseqaij; 4345f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)*B,MATMPIAIJ,&ismpiaij)); 4355f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)*B,MATSEQAIJ,&isseqaij)); 4362c71b3e2SJacob Faibussowitsch PetscCheckFalse(!ismpiaij && !isseqaij,comm,PETSC_ERR_SUP,"Only MATMPIAIJ or MATSEQAIJ are supported"); 43763c07aadSStefano Zampini } 4386ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 4392c71b3e2SJacob Faibussowitsch PetscCheckFalse(HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij),comm,PETSC_ERR_SUP,"Not yet implemented"); 4406ea7df73SStefano Zampini #endif 4415f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_size(comm,&size)); 44263c07aadSStefano Zampini 443a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 44463c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 44563c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 44663c07aadSStefano Zampini m = hypre_CSRMatrixNumRows(hdiag); 44763c07aadSStefano Zampini n = hypre_CSRMatrixNumCols(hdiag); 44863c07aadSStefano Zampini dnnz = hypre_CSRMatrixNumNonzeros(hdiag); 44963c07aadSStefano Zampini onnz = hypre_CSRMatrixNumNonzeros(hoffd); 450225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 4515f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(m+1,&dii)); 4525f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(dnnz,&djj)); 4535f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(dnnz,&da)); 454225daaf8SStefano Zampini } else if (reuse == MAT_REUSE_MATRIX) { 45563c07aadSStefano Zampini PetscInt nr; 45663c07aadSStefano Zampini PetscBool done; 45763c07aadSStefano Zampini if (size > 1) { 45863c07aadSStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data); 45963c07aadSStefano Zampini 4605f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetRowIJ(b->A,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&dii,(const PetscInt**)&djj,&done)); 4612c71b3e2SJacob Faibussowitsch PetscCheckFalse(nr != m,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows in diag part! %" PetscInt_FMT " != %" PetscInt_FMT,nr,m); 4622c71b3e2SJacob Faibussowitsch PetscCheckFalse(dii[nr] < dnnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in diag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,dii[nr],dnnz); 4635f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJGetArray(b->A,&da)); 46463c07aadSStefano Zampini } else { 4655f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetRowIJ(*B,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&dii,(const PetscInt**)&djj,&done)); 4662c71b3e2SJacob Faibussowitsch PetscCheckFalse(nr != m,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows! %" PetscInt_FMT " != %" PetscInt_FMT,nr,m); 4672c71b3e2SJacob Faibussowitsch PetscCheckFalse(dii[nr] < dnnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,dii[nr],dnnz); 4685f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJGetArray(*B,&da)); 46963c07aadSStefano Zampini } 470225daaf8SStefano Zampini } else { /* MAT_INPLACE_MATRIX */ 4712cf14000SStefano Zampini if (!sameint) { 4725f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(m+1,&dii)); 4735f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(dnnz,&djj)); 4742cf14000SStefano Zampini } else { 4757d968826Sstefano_zampini dii = (PetscInt*)hypre_CSRMatrixI(hdiag); 4767d968826Sstefano_zampini djj = (PetscInt*)hypre_CSRMatrixJ(hdiag); 47763c07aadSStefano Zampini } 47839accc25SStefano Zampini da = (PetscScalar*)hypre_CSRMatrixData(hdiag); 47963c07aadSStefano Zampini } 4802cf14000SStefano Zampini 4812cf14000SStefano Zampini if (!sameint) { 482a16187a7SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { for (i=0;i<m+1;i++) dii[i] = (PetscInt)(hypre_CSRMatrixI(hdiag)[i]); } 4832cf14000SStefano Zampini for (i=0;i<dnnz;i++) djj[i] = (PetscInt)(hypre_CSRMatrixJ(hdiag)[i]); 4842cf14000SStefano Zampini } else { 4855f80ce2aSJacob Faibussowitsch if (reuse != MAT_REUSE_MATRIX) CHKERRQ(PetscArraycpy(dii,hypre_CSRMatrixI(hdiag),m+1)); 4865f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(djj,hypre_CSRMatrixJ(hdiag),dnnz)); 4872cf14000SStefano Zampini } 4885f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(da,hypre_CSRMatrixData(hdiag),dnnz)); 48963c07aadSStefano Zampini iptr = djj; 49063c07aadSStefano Zampini aptr = da; 49163c07aadSStefano Zampini for (i=0; i<m; i++) { 49263c07aadSStefano Zampini PetscInt nc = dii[i+1]-dii[i]; 4935f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSortIntWithScalarArray(nc,iptr,aptr)); 49463c07aadSStefano Zampini iptr += nc; 49563c07aadSStefano Zampini aptr += nc; 49663c07aadSStefano Zampini } 49763c07aadSStefano Zampini if (size > 1) { 4982cf14000SStefano Zampini HYPRE_BigInt *coffd; 4992cf14000SStefano Zampini HYPRE_Int *offdj; 50063c07aadSStefano Zampini 501225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 5025f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(m+1,&oii)); 5035f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(onnz,&ojj)); 5045f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(onnz,&oa)); 505225daaf8SStefano Zampini } else if (reuse == MAT_REUSE_MATRIX) { 50663c07aadSStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data); 50763c07aadSStefano Zampini PetscInt nr,hr = hypre_CSRMatrixNumRows(hoffd); 50863c07aadSStefano Zampini PetscBool done; 50963c07aadSStefano Zampini 5105f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetRowIJ(b->B,0,PETSC_FALSE,PETSC_FALSE,&nr,(const PetscInt**)&oii,(const PetscInt**)&ojj,&done)); 5112c71b3e2SJacob Faibussowitsch PetscCheckFalse(nr != hr,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of local rows in offdiag part! %" PetscInt_FMT " != %" PetscInt_FMT,nr,hr); 5122c71b3e2SJacob Faibussowitsch PetscCheckFalse(oii[nr] < onnz,PETSC_COMM_SELF,PETSC_ERR_USER,"Cannot reuse mat: invalid number of nonzeros in offdiag part! reuse %" PetscInt_FMT " hypre %" PetscInt_FMT,oii[nr],onnz); 5135f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJGetArray(b->B,&oa)); 514225daaf8SStefano Zampini } else { /* MAT_INPLACE_MATRIX */ 5152cf14000SStefano Zampini if (!sameint) { 5165f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(m+1,&oii)); 5175f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(onnz,&ojj)); 5182cf14000SStefano Zampini } else { 5197d968826Sstefano_zampini oii = (PetscInt*)hypre_CSRMatrixI(hoffd); 5207d968826Sstefano_zampini ojj = (PetscInt*)hypre_CSRMatrixJ(hoffd); 52163c07aadSStefano Zampini } 52239accc25SStefano Zampini oa = (PetscScalar*)hypre_CSRMatrixData(hoffd); 52363c07aadSStefano Zampini } 524a16187a7SStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 5252cf14000SStefano Zampini if (!sameint) { 5262cf14000SStefano Zampini for (i=0;i<m+1;i++) oii[i] = (PetscInt)(hypre_CSRMatrixI(hoffd)[i]); 5272cf14000SStefano Zampini } else { 5285f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(oii,hypre_CSRMatrixI(hoffd),m+1)); 5292cf14000SStefano Zampini } 530a16187a7SStefano Zampini } 5315f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(oa,hypre_CSRMatrixData(hoffd),onnz)); 532a16187a7SStefano Zampini 53363c07aadSStefano Zampini offdj = hypre_CSRMatrixJ(hoffd); 53463c07aadSStefano Zampini coffd = hypre_ParCSRMatrixColMapOffd(parcsr); 535a16187a7SStefano Zampini /* we only need the permutation to be computed properly, I don't know if HYPRE 536a16187a7SStefano Zampini messes up with the ordering. Just in case, allocate some memory and free it 537a16187a7SStefano Zampini later */ 538a16187a7SStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 539a16187a7SStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ*)((*B)->data); 540a16187a7SStefano Zampini PetscInt mnz; 541a16187a7SStefano Zampini 5425f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJGetMaxRowNonzeros(b->B,&mnz)); 5435f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(mnz,&ojj)); 544a16187a7SStefano Zampini } else for (i=0; i<onnz; i++) ojj[i] = coffd[offdj[i]]; 54563c07aadSStefano Zampini iptr = ojj; 54663c07aadSStefano Zampini aptr = oa; 54763c07aadSStefano Zampini for (i=0; i<m; i++) { 54863c07aadSStefano Zampini PetscInt nc = oii[i+1]-oii[i]; 549a16187a7SStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 550a16187a7SStefano Zampini PetscInt j; 551a16187a7SStefano Zampini 552a16187a7SStefano Zampini iptr = ojj; 553a16187a7SStefano Zampini for (j=0; j<nc; j++) iptr[j] = coffd[offdj[oii[i] + j]]; 554a16187a7SStefano Zampini } 5555f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSortIntWithScalarArray(nc,iptr,aptr)); 55663c07aadSStefano Zampini iptr += nc; 55763c07aadSStefano Zampini aptr += nc; 55863c07aadSStefano Zampini } 5595f80ce2aSJacob Faibussowitsch if (reuse == MAT_REUSE_MATRIX) CHKERRQ(PetscFree(ojj)); 560225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 56163c07aadSStefano Zampini Mat_MPIAIJ *b; 56263c07aadSStefano Zampini Mat_SeqAIJ *d,*o; 563225daaf8SStefano Zampini 5645f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateMPIAIJWithSplitArrays(comm,m,n,PETSC_DECIDE,PETSC_DECIDE,dii,djj,da,oii,ojj,oa,B)); 56563c07aadSStefano Zampini /* hack MPIAIJ */ 56663c07aadSStefano Zampini b = (Mat_MPIAIJ*)((*B)->data); 56763c07aadSStefano Zampini d = (Mat_SeqAIJ*)b->A->data; 56863c07aadSStefano Zampini o = (Mat_SeqAIJ*)b->B->data; 56963c07aadSStefano Zampini d->free_a = PETSC_TRUE; 57063c07aadSStefano Zampini d->free_ij = PETSC_TRUE; 57163c07aadSStefano Zampini o->free_a = PETSC_TRUE; 57263c07aadSStefano Zampini o->free_ij = PETSC_TRUE; 573225daaf8SStefano Zampini } else if (reuse == MAT_INPLACE_MATRIX) { 574225daaf8SStefano Zampini Mat T; 5752cf14000SStefano Zampini 5765f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateMPIAIJWithSplitArrays(comm,m,n,PETSC_DECIDE,PETSC_DECIDE,dii,djj,da,oii,ojj,oa,&T)); 5772cf14000SStefano Zampini if (sameint) { /* ownership of CSR pointers is transferred to PETSc */ 578225daaf8SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 579225daaf8SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 580225daaf8SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 581225daaf8SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 5822cf14000SStefano Zampini } else { /* Hack MPIAIJ -> free ij but not a */ 5832cf14000SStefano Zampini Mat_MPIAIJ *b = (Mat_MPIAIJ*)(T->data); 5842cf14000SStefano Zampini Mat_SeqAIJ *d = (Mat_SeqAIJ*)(b->A->data); 5852cf14000SStefano Zampini Mat_SeqAIJ *o = (Mat_SeqAIJ*)(b->B->data); 5862cf14000SStefano Zampini 5872cf14000SStefano Zampini d->free_ij = PETSC_TRUE; 5882cf14000SStefano Zampini o->free_ij = PETSC_TRUE; 5892cf14000SStefano Zampini } 5902cf14000SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 591225daaf8SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 5925f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderReplace(A,&T)); 59363c07aadSStefano Zampini } 594225daaf8SStefano Zampini } else { 595225daaf8SStefano Zampini oii = NULL; 596225daaf8SStefano Zampini ojj = NULL; 597225daaf8SStefano Zampini oa = NULL; 598225daaf8SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 59963c07aadSStefano Zampini Mat_SeqAIJ* b; 6002cf14000SStefano Zampini 6015f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateSeqAIJWithArrays(comm,m,n,dii,djj,da,B)); 60263c07aadSStefano Zampini /* hack SeqAIJ */ 60363c07aadSStefano Zampini b = (Mat_SeqAIJ*)((*B)->data); 60463c07aadSStefano Zampini b->free_a = PETSC_TRUE; 60563c07aadSStefano Zampini b->free_ij = PETSC_TRUE; 606225daaf8SStefano Zampini } else if (reuse == MAT_INPLACE_MATRIX) { 607225daaf8SStefano Zampini Mat T; 6082cf14000SStefano Zampini 6095f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateSeqAIJWithArrays(comm,m,n,dii,djj,da,&T)); 6102cf14000SStefano Zampini if (sameint) { /* ownership of CSR pointers is transferred to PETSc */ 611225daaf8SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 612225daaf8SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 6132cf14000SStefano Zampini } else { /* free ij but not a */ 6142cf14000SStefano Zampini Mat_SeqAIJ* b = (Mat_SeqAIJ*)(T->data); 6152cf14000SStefano Zampini 6162cf14000SStefano Zampini b->free_ij = PETSC_TRUE; 6172cf14000SStefano Zampini } 618225daaf8SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 6195f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderReplace(A,&T)); 62063c07aadSStefano Zampini } 621225daaf8SStefano Zampini } 622225daaf8SStefano Zampini 6232cf14000SStefano Zampini /* we have to use hypre_Tfree to free the HYPRE arrays 6242cf14000SStefano Zampini that PETSc now onws */ 62563c07aadSStefano Zampini if (reuse == MAT_INPLACE_MATRIX) { 6262cf14000SStefano Zampini PetscInt nh; 6272cf14000SStefano Zampini void *ptrs[6] = {da,oa,dii,djj,oii,ojj}; 6282cf14000SStefano Zampini const char *names[6] = {"_hypre_csr_da", 6292cf14000SStefano Zampini "_hypre_csr_oa", 6302cf14000SStefano Zampini "_hypre_csr_dii", 631225daaf8SStefano Zampini "_hypre_csr_djj", 632225daaf8SStefano Zampini "_hypre_csr_oii", 6332cf14000SStefano Zampini "_hypre_csr_ojj"}; 6342cf14000SStefano Zampini nh = sameint ? 6 : 2; 6352cf14000SStefano Zampini for (i=0; i<nh; i++) { 636225daaf8SStefano Zampini PetscContainer c; 637225daaf8SStefano Zampini 6385f80ce2aSJacob Faibussowitsch CHKERRQ(PetscContainerCreate(comm,&c)); 6395f80ce2aSJacob Faibussowitsch CHKERRQ(PetscContainerSetPointer(c,ptrs[i])); 6405f80ce2aSJacob Faibussowitsch CHKERRQ(PetscContainerSetUserDestroy(c,hypre_array_destroy)); 6415f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectCompose((PetscObject)(*B),names[i],(PetscObject)c)); 6425f80ce2aSJacob Faibussowitsch CHKERRQ(PetscContainerDestroy(&c)); 643225daaf8SStefano Zampini } 64463c07aadSStefano Zampini } 64563c07aadSStefano Zampini PetscFunctionReturn(0); 64663c07aadSStefano Zampini } 64763c07aadSStefano Zampini 648613e5ff0Sstefano_zampini static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 649c1a070e6SStefano Zampini { 650613e5ff0Sstefano_zampini hypre_ParCSRMatrix *tA; 651c1a070e6SStefano Zampini hypre_CSRMatrix *hdiag,*hoffd; 652c1a070e6SStefano Zampini Mat_SeqAIJ *diag,*offd; 6532cf14000SStefano Zampini PetscInt *garray,i,noffd,dnnz,onnz,*row_starts,*col_starts; 654c1a070e6SStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 655613e5ff0Sstefano_zampini PetscBool ismpiaij,isseqaij; 6562cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 6576ea7df73SStefano Zampini HYPRE_Int *hdi = NULL,*hdj = NULL,*hoi = NULL,*hoj = NULL; 6585c97c10fSStefano Zampini PetscInt *pdi = NULL,*pdj = NULL,*poi = NULL,*poj = NULL; 6596ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 6606ea7df73SStefano Zampini PetscBool iscuda = PETSC_FALSE; 6616ea7df73SStefano Zampini #endif 662c1a070e6SStefano Zampini 663c1a070e6SStefano Zampini PetscFunctionBegin; 6645f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&ismpiaij)); 6655f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATSEQAIJ,&isseqaij)); 6662c71b3e2SJacob Faibussowitsch PetscCheckFalse(!ismpiaij && !isseqaij,comm,PETSC_ERR_SUP,"Unsupported type %s",((PetscObject)A)->type_name); 667c1a070e6SStefano Zampini if (ismpiaij) { 668c1a070e6SStefano Zampini Mat_MPIAIJ *a = (Mat_MPIAIJ*)(A->data); 669c1a070e6SStefano Zampini 670c1a070e6SStefano Zampini diag = (Mat_SeqAIJ*)a->A->data; 671c1a070e6SStefano Zampini offd = (Mat_SeqAIJ*)a->B->data; 6726ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) && defined(HYPRE_USING_CUDA) 6735f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)A,MATMPIAIJCUSPARSE,&iscuda)); 6746ea7df73SStefano Zampini if (iscuda && !A->boundtocpu) { 6756ea7df73SStefano Zampini sameint = PETSC_TRUE; 6765f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJCUSPARSEGetIJ(a->A,PETSC_FALSE,(const HYPRE_Int**)&hdi,(const HYPRE_Int**)&hdj)); 6775f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJCUSPARSEGetIJ(a->B,PETSC_FALSE,(const HYPRE_Int**)&hoi,(const HYPRE_Int**)&hoj)); 6786ea7df73SStefano Zampini } else { 6796ea7df73SStefano Zampini #else 6806ea7df73SStefano Zampini { 6816ea7df73SStefano Zampini #endif 6826ea7df73SStefano Zampini pdi = diag->i; 6836ea7df73SStefano Zampini pdj = diag->j; 6846ea7df73SStefano Zampini poi = offd->i; 6856ea7df73SStefano Zampini poj = offd->j; 6866ea7df73SStefano Zampini if (sameint) { 6876ea7df73SStefano Zampini hdi = (HYPRE_Int*)pdi; 6886ea7df73SStefano Zampini hdj = (HYPRE_Int*)pdj; 6896ea7df73SStefano Zampini hoi = (HYPRE_Int*)poi; 6906ea7df73SStefano Zampini hoj = (HYPRE_Int*)poj; 6916ea7df73SStefano Zampini } 6926ea7df73SStefano Zampini } 693c1a070e6SStefano Zampini garray = a->garray; 694c1a070e6SStefano Zampini noffd = a->B->cmap->N; 695c1a070e6SStefano Zampini dnnz = diag->nz; 696c1a070e6SStefano Zampini onnz = offd->nz; 697c1a070e6SStefano Zampini } else { 698c1a070e6SStefano Zampini diag = (Mat_SeqAIJ*)A->data; 699c1a070e6SStefano Zampini offd = NULL; 7006ea7df73SStefano Zampini #if defined(PETSC_HAVE_CUDA) && defined(PETSC_HAVE_HYPRE_DEVICE) 7015f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)A,MATSEQAIJCUSPARSE,&iscuda)); 7026ea7df73SStefano Zampini if (iscuda && !A->boundtocpu) { 7036ea7df73SStefano Zampini sameint = PETSC_TRUE; 7045f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqAIJCUSPARSEGetIJ(A,PETSC_FALSE,(const HYPRE_Int**)&hdi,(const HYPRE_Int**)&hdj)); 7056ea7df73SStefano Zampini } else { 7066ea7df73SStefano Zampini #else 7076ea7df73SStefano Zampini { 7086ea7df73SStefano Zampini #endif 7096ea7df73SStefano Zampini pdi = diag->i; 7106ea7df73SStefano Zampini pdj = diag->j; 7116ea7df73SStefano Zampini if (sameint) { 7126ea7df73SStefano Zampini hdi = (HYPRE_Int*)pdi; 7136ea7df73SStefano Zampini hdj = (HYPRE_Int*)pdj; 7146ea7df73SStefano Zampini } 7156ea7df73SStefano Zampini } 716c1a070e6SStefano Zampini garray = NULL; 717c1a070e6SStefano Zampini noffd = 0; 718c1a070e6SStefano Zampini dnnz = diag->nz; 719c1a070e6SStefano Zampini onnz = 0; 720c1a070e6SStefano Zampini } 721225daaf8SStefano Zampini 722c1a070e6SStefano Zampini /* create a temporary ParCSR */ 723c1a070e6SStefano Zampini if (HYPRE_AssumedPartitionCheck()) { 724c1a070e6SStefano Zampini PetscMPIInt myid; 725c1a070e6SStefano Zampini 7265f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_rank(comm,&myid)); 727c1a070e6SStefano Zampini row_starts = A->rmap->range + myid; 728c1a070e6SStefano Zampini col_starts = A->cmap->range + myid; 729c1a070e6SStefano Zampini } else { 730c1a070e6SStefano Zampini row_starts = A->rmap->range; 731c1a070e6SStefano Zampini col_starts = A->cmap->range; 732c1a070e6SStefano Zampini } 7332cf14000SStefano Zampini tA = hypre_ParCSRMatrixCreate(comm,A->rmap->N,A->cmap->N,(HYPRE_BigInt*)row_starts,(HYPRE_BigInt*)col_starts,noffd,dnnz,onnz); 734a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 735c1a070e6SStefano Zampini hypre_ParCSRMatrixSetRowStartsOwner(tA,0); 736c1a070e6SStefano Zampini hypre_ParCSRMatrixSetColStartsOwner(tA,0); 737a1d2239cSSatish Balay #endif 738c1a070e6SStefano Zampini 739225daaf8SStefano Zampini /* set diagonal part */ 740c1a070e6SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(tA); 7416ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 7425f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc2(A->rmap->n+1,&hdi,dnnz,&hdj)); 7436ea7df73SStefano Zampini for (i = 0; i < A->rmap->n+1; i++) hdi[i] = (HYPRE_Int)(pdi[i]); 7446ea7df73SStefano Zampini for (i = 0; i < dnnz; i++) hdj[i] = (HYPRE_Int)(pdj[i]); 7452cf14000SStefano Zampini } 7466ea7df73SStefano Zampini hypre_CSRMatrixI(hdiag) = hdi; 7476ea7df73SStefano Zampini hypre_CSRMatrixJ(hdiag) = hdj; 74839accc25SStefano Zampini hypre_CSRMatrixData(hdiag) = (HYPRE_Complex*)diag->a; 749c1a070e6SStefano Zampini hypre_CSRMatrixNumNonzeros(hdiag) = diag->nz; 750c1a070e6SStefano Zampini hypre_CSRMatrixSetRownnz(hdiag); 751c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hdiag,0); 752c1a070e6SStefano Zampini 753225daaf8SStefano Zampini /* set offdiagonal part */ 754c1a070e6SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(tA); 755c1a070e6SStefano Zampini if (offd) { 7566ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */ 7575f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc2(A->rmap->n+1,&hoi,onnz,&hoj)); 7586ea7df73SStefano Zampini for (i = 0; i < A->rmap->n+1; i++) hoi[i] = (HYPRE_Int)(poi[i]); 7596ea7df73SStefano Zampini for (i = 0; i < onnz; i++) hoj[i] = (HYPRE_Int)(poj[i]); 7602cf14000SStefano Zampini } 7616ea7df73SStefano Zampini hypre_CSRMatrixI(hoffd) = hoi; 7626ea7df73SStefano Zampini hypre_CSRMatrixJ(hoffd) = hoj; 76339accc25SStefano Zampini hypre_CSRMatrixData(hoffd) = (HYPRE_Complex*)offd->a; 764c1a070e6SStefano Zampini hypre_CSRMatrixNumNonzeros(hoffd) = offd->nz; 765c1a070e6SStefano Zampini hypre_CSRMatrixSetRownnz(hoffd); 766c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hoffd,0); 7676ea7df73SStefano Zampini } 7686ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 769a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixInitialize_v2,tA,iscuda ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST); 7706ea7df73SStefano Zampini #else 7716ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0) 772a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixInitialize,tA); 7736ea7df73SStefano Zampini #else 774a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixInitialize_v2,tA,HYPRE_MEMORY_HOST); 7756ea7df73SStefano Zampini #endif 7766ea7df73SStefano Zampini #endif 7776ea7df73SStefano Zampini hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA),HYPRE_MEMORY_HOST); 778c1a070e6SStefano Zampini hypre_ParCSRMatrixSetNumNonzeros(tA); 7792cf14000SStefano Zampini hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt*)garray; 780a74df02fSJacob Faibussowitsch if (!hypre_ParCSRMatrixCommPkg(tA)) PetscStackCallStandard(hypre_MatvecCommPkgCreate,tA); 781613e5ff0Sstefano_zampini *hA = tA; 782613e5ff0Sstefano_zampini PetscFunctionReturn(0); 783613e5ff0Sstefano_zampini } 784c1a070e6SStefano Zampini 785613e5ff0Sstefano_zampini static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA) 786613e5ff0Sstefano_zampini { 787613e5ff0Sstefano_zampini hypre_CSRMatrix *hdiag,*hoffd; 7886ea7df73SStefano Zampini PetscBool ismpiaij,sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int)); 7896ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 7906ea7df73SStefano Zampini PetscBool iscuda = PETSC_FALSE; 7916ea7df73SStefano Zampini #endif 792c1a070e6SStefano Zampini 793613e5ff0Sstefano_zampini PetscFunctionBegin; 7945f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectBaseTypeCompare((PetscObject)A,MATMPIAIJ,&ismpiaij)); 7956ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 7965f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompareAny((PetscObject)A,&iscuda,MATSEQAIJCUSPARSE,MATMPIAIJCUSPARSE,"")); 7976ea7df73SStefano Zampini if (iscuda) sameint = PETSC_TRUE; 7986ea7df73SStefano Zampini #endif 799613e5ff0Sstefano_zampini hdiag = hypre_ParCSRMatrixDiag(*hA); 800613e5ff0Sstefano_zampini hoffd = hypre_ParCSRMatrixOffd(*hA); 8016ea7df73SStefano Zampini /* free temporary memory allocated by PETSc 8026ea7df73SStefano Zampini set pointers to NULL before destroying tA */ 8032cf14000SStefano Zampini if (!sameint) { 8042cf14000SStefano Zampini HYPRE_Int *hi,*hj; 8052cf14000SStefano Zampini 8062cf14000SStefano Zampini hi = hypre_CSRMatrixI(hdiag); 8072cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hdiag); 8085f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree2(hi,hj)); 8096ea7df73SStefano Zampini if (ismpiaij) { 8102cf14000SStefano Zampini hi = hypre_CSRMatrixI(hoffd); 8112cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hoffd); 8125f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree2(hi,hj)); 8132cf14000SStefano Zampini } 8142cf14000SStefano Zampini } 815c1a070e6SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL; 816c1a070e6SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL; 817c1a070e6SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL; 8186ea7df73SStefano Zampini if (ismpiaij) { 819c1a070e6SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL; 820c1a070e6SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL; 821c1a070e6SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL; 8226ea7df73SStefano Zampini } 823613e5ff0Sstefano_zampini hypre_ParCSRMatrixColMapOffd(*hA) = NULL; 824613e5ff0Sstefano_zampini hypre_ParCSRMatrixDestroy(*hA); 825613e5ff0Sstefano_zampini *hA = NULL; 826613e5ff0Sstefano_zampini PetscFunctionReturn(0); 827613e5ff0Sstefano_zampini } 828613e5ff0Sstefano_zampini 829613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG: 8303dad0653Sstefano_zampini the resulting ParCSR will not own the column and row starts 8316ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 832a055b5aaSBarry Smith static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA,hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP) 833613e5ff0Sstefano_zampini { 834a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 835613e5ff0Sstefano_zampini HYPRE_Int P_owns_col_starts,R_owns_row_starts; 836a1d2239cSSatish Balay #endif 837613e5ff0Sstefano_zampini 838613e5ff0Sstefano_zampini PetscFunctionBegin; 839a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 840613e5ff0Sstefano_zampini P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP); 841613e5ff0Sstefano_zampini R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR); 842a1d2239cSSatish Balay #endif 8436ea7df73SStefano Zampini /* can be replaced by version test later */ 8446ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 8456ea7df73SStefano Zampini PetscStackPush("hypre_ParCSRMatrixRAP"); 8466ea7df73SStefano Zampini *hRAP = hypre_ParCSRMatrixRAP(hR,hA,hP); 8476ea7df73SStefano Zampini PetscStackPop; 8486ea7df73SStefano Zampini #else 849a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_BoomerAMGBuildCoarseOperator,hR,hA,hP,hRAP); 850a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixSetNumNonzeros,*hRAP); 8516ea7df73SStefano Zampini #endif 852613e5ff0Sstefano_zampini /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */ 853a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 854613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetRowStartsOwner(*hRAP,0); 855613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetColStartsOwner(*hRAP,0); 856613e5ff0Sstefano_zampini if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP,1); 857613e5ff0Sstefano_zampini if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR,1); 858a1d2239cSSatish Balay #endif 859613e5ff0Sstefano_zampini PetscFunctionReturn(0); 860613e5ff0Sstefano_zampini } 861613e5ff0Sstefano_zampini 8626f231fbdSstefano_zampini static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A,Mat P,Mat C) 863613e5ff0Sstefano_zampini { 8646f231fbdSstefano_zampini Mat B; 8656abb4441SStefano Zampini hypre_ParCSRMatrix *hA,*hP,*hPtAP = NULL; 8664222ddf1SHong Zhang Mat_Product *product=C->product; 867613e5ff0Sstefano_zampini 868613e5ff0Sstefano_zampini PetscFunctionBegin; 8695f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJGetParCSR_Private(A,&hA)); 8705f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJGetParCSR_Private(P,&hP)); 8715f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_ParCSR_RAP(hP,hA,hP,&hPtAP)); 8725f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(hPtAP,MATAIJ,PETSC_OWN_POINTER,&B)); 8734222ddf1SHong Zhang 8745f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderMerge(C,&B)); 8754222ddf1SHong Zhang C->product = product; 8764222ddf1SHong Zhang 8775f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJRestoreParCSR_Private(A,&hA)); 8785f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJRestoreParCSR_Private(P,&hP)); 8796f231fbdSstefano_zampini PetscFunctionReturn(0); 8806f231fbdSstefano_zampini } 8816f231fbdSstefano_zampini 8824222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A,Mat P,PetscReal fill,Mat C) 8836f231fbdSstefano_zampini { 8846f231fbdSstefano_zampini PetscFunctionBegin; 8855f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(C,MATAIJ)); 8864222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_AIJ_wHYPRE; 8874222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 888613e5ff0Sstefano_zampini PetscFunctionReturn(0); 889613e5ff0Sstefano_zampini } 890613e5ff0Sstefano_zampini 8914cc28894Sstefano_zampini static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A,Mat P,Mat C) 892613e5ff0Sstefano_zampini { 8934cc28894Sstefano_zampini Mat B; 8944cc28894Sstefano_zampini Mat_HYPRE *hP; 8956abb4441SStefano Zampini hypre_ParCSRMatrix *hA = NULL,*Pparcsr,*ptapparcsr = NULL; 896613e5ff0Sstefano_zampini HYPRE_Int type; 897613e5ff0Sstefano_zampini MPI_Comm comm = PetscObjectComm((PetscObject)A); 8984cc28894Sstefano_zampini PetscBool ishypre; 899613e5ff0Sstefano_zampini 900613e5ff0Sstefano_zampini PetscFunctionBegin; 9015f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)P,MATHYPRE,&ishypre)); 902*28b400f6SJacob Faibussowitsch PetscCheck(ishypre,comm,PETSC_ERR_USER,"P should be of type %s",MATHYPRE); 9034cc28894Sstefano_zampini hP = (Mat_HYPRE*)P->data; 904a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hP->ij,&type); 9052c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,comm,PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 906a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hP->ij,(void**)&Pparcsr); 907613e5ff0Sstefano_zampini 9085f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJGetParCSR_Private(A,&hA)); 9095f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_ParCSR_RAP(Pparcsr,hA,Pparcsr,&ptapparcsr)); 9105f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJRestoreParCSR_Private(A,&hA)); 911225daaf8SStefano Zampini 9124cc28894Sstefano_zampini /* create temporary matrix and merge to C */ 9135f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(ptapparcsr,((PetscObject)C)->type_name,PETSC_OWN_POINTER,&B)); 9145f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderMerge(C,&B)); 9154cc28894Sstefano_zampini PetscFunctionReturn(0); 9164cc28894Sstefano_zampini } 9174cc28894Sstefano_zampini 9184cc28894Sstefano_zampini static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A,Mat P,Mat C) 9194cc28894Sstefano_zampini { 9204cc28894Sstefano_zampini Mat B; 9216abb4441SStefano Zampini hypre_ParCSRMatrix *Aparcsr,*Pparcsr,*ptapparcsr = NULL; 9224cc28894Sstefano_zampini Mat_HYPRE *hA,*hP; 9234cc28894Sstefano_zampini PetscBool ishypre; 9244cc28894Sstefano_zampini HYPRE_Int type; 9254cc28894Sstefano_zampini 9264cc28894Sstefano_zampini PetscFunctionBegin; 9275f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)P,MATHYPRE,&ishypre)); 928*28b400f6SJacob Faibussowitsch PetscCheck(ishypre,PetscObjectComm((PetscObject)P),PETSC_ERR_USER,"P should be of type %s",MATHYPRE); 9295f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&ishypre)); 930*28b400f6SJacob Faibussowitsch PetscCheck(ishypre,PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"A should be of type %s",MATHYPRE); 9314cc28894Sstefano_zampini hA = (Mat_HYPRE*)A->data; 9324cc28894Sstefano_zampini hP = (Mat_HYPRE*)P->data; 933a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hA->ij,&type); 9342c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 935a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hP->ij,&type); 9362c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)P),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 937a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&Aparcsr); 938a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hP->ij,(void**)&Pparcsr); 9395f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_ParCSR_RAP(Pparcsr,Aparcsr,Pparcsr,&ptapparcsr)); 9405f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(ptapparcsr,MATHYPRE,PETSC_OWN_POINTER,&B)); 9415f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderMerge(C,&B)); 9424cc28894Sstefano_zampini PetscFunctionReturn(0); 9434cc28894Sstefano_zampini } 9444cc28894Sstefano_zampini 945d501dc42Sstefano_zampini /* calls hypre_ParMatmul 946d501dc42Sstefano_zampini hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA 9473dad0653Sstefano_zampini hypre_ParMatrixCreate does not duplicate the communicator 9486ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */ 949d501dc42Sstefano_zampini static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB) 950d501dc42Sstefano_zampini { 951d501dc42Sstefano_zampini PetscFunctionBegin; 9526ea7df73SStefano Zampini /* can be replaced by version test later */ 9536ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 9546ea7df73SStefano Zampini PetscStackPush("hypre_ParCSRMatMat"); 9556ea7df73SStefano Zampini *hAB = hypre_ParCSRMatMat(hA,hB); 9566ea7df73SStefano Zampini #else 957d501dc42Sstefano_zampini PetscStackPush("hypre_ParMatmul"); 958d501dc42Sstefano_zampini *hAB = hypre_ParMatmul(hA,hB); 9596ea7df73SStefano Zampini #endif 960d501dc42Sstefano_zampini PetscStackPop; 961d501dc42Sstefano_zampini PetscFunctionReturn(0); 962d501dc42Sstefano_zampini } 963d501dc42Sstefano_zampini 9645e5acdf2Sstefano_zampini static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C) 9655e5acdf2Sstefano_zampini { 9665e5acdf2Sstefano_zampini Mat D; 967d501dc42Sstefano_zampini hypre_ParCSRMatrix *hA,*hB,*hAB = NULL; 9684222ddf1SHong Zhang Mat_Product *product=C->product; 9695e5acdf2Sstefano_zampini 9705e5acdf2Sstefano_zampini PetscFunctionBegin; 9715f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJGetParCSR_Private(A,&hA)); 9725f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJGetParCSR_Private(B,&hB)); 9735f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_ParCSR_MatMatMult(hA,hB,&hAB)); 9745f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(hAB,MATAIJ,PETSC_OWN_POINTER,&D)); 9754222ddf1SHong Zhang 9765f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderMerge(C,&D)); 9774222ddf1SHong Zhang C->product = product; 9784222ddf1SHong Zhang 9795f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJRestoreParCSR_Private(A,&hA)); 9805f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJRestoreParCSR_Private(B,&hB)); 9815e5acdf2Sstefano_zampini PetscFunctionReturn(0); 9825e5acdf2Sstefano_zampini } 9835e5acdf2Sstefano_zampini 9844222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A,Mat B,PetscReal fill,Mat C) 9855e5acdf2Sstefano_zampini { 9865e5acdf2Sstefano_zampini PetscFunctionBegin; 9875f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(C,MATAIJ)); 9884222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE; 9894222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 9905e5acdf2Sstefano_zampini PetscFunctionReturn(0); 9915e5acdf2Sstefano_zampini } 9925e5acdf2Sstefano_zampini 993d501dc42Sstefano_zampini static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A,Mat B,Mat C) 994d501dc42Sstefano_zampini { 995d501dc42Sstefano_zampini Mat D; 996d501dc42Sstefano_zampini hypre_ParCSRMatrix *Aparcsr,*Bparcsr,*ABparcsr = NULL; 997d501dc42Sstefano_zampini Mat_HYPRE *hA,*hB; 998d501dc42Sstefano_zampini PetscBool ishypre; 999d501dc42Sstefano_zampini HYPRE_Int type; 10004222ddf1SHong Zhang Mat_Product *product; 1001d501dc42Sstefano_zampini 1002d501dc42Sstefano_zampini PetscFunctionBegin; 10035f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)B,MATHYPRE,&ishypre)); 1004*28b400f6SJacob Faibussowitsch PetscCheck(ishypre,PetscObjectComm((PetscObject)B),PETSC_ERR_USER,"B should be of type %s",MATHYPRE); 10055f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&ishypre)); 1006*28b400f6SJacob Faibussowitsch PetscCheck(ishypre,PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"A should be of type %s",MATHYPRE); 1007d501dc42Sstefano_zampini hA = (Mat_HYPRE*)A->data; 1008d501dc42Sstefano_zampini hB = (Mat_HYPRE*)B->data; 1009a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hA->ij,&type); 10102c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 1011a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hB->ij,&type); 10122c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)B),PETSC_ERR_SUP,"Only HYPRE_PARCSR is supported"); 1013a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&Aparcsr); 1014a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hB->ij,(void**)&Bparcsr); 10155f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_ParCSR_MatMatMult(Aparcsr,Bparcsr,&ABparcsr)); 10165f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(ABparcsr,MATHYPRE,PETSC_OWN_POINTER,&D)); 10174222ddf1SHong Zhang 1018d501dc42Sstefano_zampini /* need to use HeaderReplace because HeaderMerge messes up with the communicator */ 10194222ddf1SHong Zhang product = C->product; /* save it from MatHeaderReplace() */ 10204222ddf1SHong Zhang C->product = NULL; 10215f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderReplace(C,&D)); 10224222ddf1SHong Zhang C->product = product; 1023d501dc42Sstefano_zampini C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 10244222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 1025d501dc42Sstefano_zampini PetscFunctionReturn(0); 1026d501dc42Sstefano_zampini } 1027d501dc42Sstefano_zampini 10283dad0653Sstefano_zampini PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C,Mat D) 102920e1dc0dSstefano_zampini { 103020e1dc0dSstefano_zampini Mat E; 10316abb4441SStefano Zampini hypre_ParCSRMatrix *hA,*hB,*hC,*hABC = NULL; 103220e1dc0dSstefano_zampini 103320e1dc0dSstefano_zampini PetscFunctionBegin; 10345f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJGetParCSR_Private(A,&hA)); 10355f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJGetParCSR_Private(B,&hB)); 10365f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJGetParCSR_Private(C,&hC)); 10375f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_ParCSR_RAP(hA,hB,hC,&hABC)); 10385f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(hABC,MATAIJ,PETSC_OWN_POINTER,&E)); 10395f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderMerge(D,&E)); 10405f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJRestoreParCSR_Private(A,&hA)); 10415f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJRestoreParCSR_Private(B,&hB)); 10425f80ce2aSJacob Faibussowitsch CHKERRQ(MatAIJRestoreParCSR_Private(C,&hC)); 104320e1dc0dSstefano_zampini PetscFunctionReturn(0); 104420e1dc0dSstefano_zampini } 104520e1dc0dSstefano_zampini 10464222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A,Mat B,Mat C,PetscReal fill,Mat D) 104720e1dc0dSstefano_zampini { 104820e1dc0dSstefano_zampini PetscFunctionBegin; 10495f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(D,MATAIJ)); 105020e1dc0dSstefano_zampini PetscFunctionReturn(0); 105120e1dc0dSstefano_zampini } 105220e1dc0dSstefano_zampini 10534222ddf1SHong Zhang /* ---------------------------------------------------- */ 10544222ddf1SHong Zhang static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C) 10554222ddf1SHong Zhang { 10564222ddf1SHong Zhang PetscFunctionBegin; 10574222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 10584222ddf1SHong Zhang PetscFunctionReturn(0); 10594222ddf1SHong Zhang } 10604222ddf1SHong Zhang 10614222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C) 10624222ddf1SHong Zhang { 10634222ddf1SHong Zhang Mat_Product *product = C->product; 10644222ddf1SHong Zhang PetscBool Ahypre; 10654222ddf1SHong Zhang 10664222ddf1SHong Zhang PetscFunctionBegin; 10675f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)product->A,MATHYPRE,&Ahypre)); 10684222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 10695f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(C,MATHYPRE)); 10704222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE; 10714222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE; 10724222ddf1SHong Zhang PetscFunctionReturn(0); 10736718818eSStefano Zampini } 10744222ddf1SHong Zhang PetscFunctionReturn(0); 10754222ddf1SHong Zhang } 10764222ddf1SHong Zhang 10774222ddf1SHong Zhang static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C) 10784222ddf1SHong Zhang { 10794222ddf1SHong Zhang PetscFunctionBegin; 10804222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP; 10814222ddf1SHong Zhang PetscFunctionReturn(0); 10824222ddf1SHong Zhang } 10834222ddf1SHong Zhang 10844222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C) 10854222ddf1SHong Zhang { 10864222ddf1SHong Zhang Mat_Product *product = C->product; 10874222ddf1SHong Zhang PetscBool flg; 10884222ddf1SHong Zhang PetscInt type = 0; 10894222ddf1SHong Zhang const char *outTypes[4] = {"aij","seqaij","mpiaij","hypre"}; 10904222ddf1SHong Zhang PetscInt ntype = 4; 10914222ddf1SHong Zhang Mat A = product->A; 10924222ddf1SHong Zhang PetscBool Ahypre; 10935f80ce2aSJacob Faibussowitsch PetscErrorCode ierr; 10944222ddf1SHong Zhang 10954222ddf1SHong Zhang PetscFunctionBegin; 10965f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)A,MATHYPRE,&Ahypre)); 10974222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */ 10985f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(C,MATHYPRE)); 10994222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 11004222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_HYPRE_HYPRE; 11014222ddf1SHong Zhang PetscFunctionReturn(0); 11024222ddf1SHong Zhang } 11034222ddf1SHong Zhang 11044222ddf1SHong Zhang /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */ 11054222ddf1SHong Zhang /* Get runtime option */ 11064222ddf1SHong Zhang if (product->api_user) { 11074222ddf1SHong Zhang ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)C),((PetscObject)C)->prefix,"MatPtAP_HYPRE","Mat");CHKERRQ(ierr); 11085f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsEList("-matptap_hypre_outtype","MatPtAP outtype","MatPtAP outtype",outTypes,ntype,outTypes[type],&type,&flg)); 11094222ddf1SHong Zhang ierr = PetscOptionsEnd();CHKERRQ(ierr); 11104222ddf1SHong Zhang } else { 11114222ddf1SHong Zhang ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)C),((PetscObject)C)->prefix,"MatProduct_PtAP_HYPRE","Mat");CHKERRQ(ierr); 11125f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsEList("-mat_product_algorithm_hypre_outtype","MatProduct_PtAP outtype","MatProduct_PtAP",outTypes,ntype,outTypes[type],&type,&flg)); 11134222ddf1SHong Zhang ierr = PetscOptionsEnd();CHKERRQ(ierr); 11144222ddf1SHong Zhang } 11154222ddf1SHong Zhang 11164222ddf1SHong Zhang if (type == 0 || type == 1 || type == 2) { 11175f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(C,MATAIJ)); 11184222ddf1SHong Zhang } else if (type == 3) { 11195f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(C,MATHYPRE)); 11204222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_SUP,"MatPtAP outtype is not supported"); 11214222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE; 11224222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_HYPRE; 11234222ddf1SHong Zhang PetscFunctionReturn(0); 11244222ddf1SHong Zhang } 11254222ddf1SHong Zhang 11264222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C) 11274222ddf1SHong Zhang { 11284222ddf1SHong Zhang Mat_Product *product = C->product; 11294222ddf1SHong Zhang 11304222ddf1SHong Zhang PetscFunctionBegin; 11314222ddf1SHong Zhang switch (product->type) { 11324222ddf1SHong Zhang case MATPRODUCT_AB: 11335f80ce2aSJacob Faibussowitsch CHKERRQ(MatProductSetFromOptions_HYPRE_AB(C)); 11344222ddf1SHong Zhang break; 11354222ddf1SHong Zhang case MATPRODUCT_PtAP: 11365f80ce2aSJacob Faibussowitsch CHKERRQ(MatProductSetFromOptions_HYPRE_PtAP(C)); 11374222ddf1SHong Zhang break; 11386718818eSStefano Zampini default: 11396718818eSStefano Zampini break; 11404222ddf1SHong Zhang } 11414222ddf1SHong Zhang PetscFunctionReturn(0); 11424222ddf1SHong Zhang } 11434222ddf1SHong Zhang 11444222ddf1SHong Zhang /* -------------------------------------------------------- */ 11454222ddf1SHong Zhang 1146ea9daf28SStefano Zampini static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y) 114763c07aadSStefano Zampini { 114863c07aadSStefano Zampini PetscFunctionBegin; 11495f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_MultKernel_Private(A,1.0,x,0.0,y,PETSC_TRUE)); 115063c07aadSStefano Zampini PetscFunctionReturn(0); 115163c07aadSStefano Zampini } 115263c07aadSStefano Zampini 1153ea9daf28SStefano Zampini static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y) 115463c07aadSStefano Zampini { 115563c07aadSStefano Zampini PetscFunctionBegin; 11565f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_MultKernel_Private(A,1.0,x,0.0,y,PETSC_FALSE)); 115763c07aadSStefano Zampini PetscFunctionReturn(0); 115863c07aadSStefano Zampini } 115963c07aadSStefano Zampini 1160414bd5c3SStefano Zampini static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1161414bd5c3SStefano Zampini { 1162414bd5c3SStefano Zampini PetscFunctionBegin; 1163414bd5c3SStefano Zampini if (y != z) { 11645f80ce2aSJacob Faibussowitsch CHKERRQ(VecCopy(y,z)); 1165414bd5c3SStefano Zampini } 11665f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_MultKernel_Private(A,1.0,x,1.0,z,PETSC_FALSE)); 1167414bd5c3SStefano Zampini PetscFunctionReturn(0); 1168414bd5c3SStefano Zampini } 1169414bd5c3SStefano Zampini 1170414bd5c3SStefano Zampini static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z) 1171414bd5c3SStefano Zampini { 1172414bd5c3SStefano Zampini PetscFunctionBegin; 1173414bd5c3SStefano Zampini if (y != z) { 11745f80ce2aSJacob Faibussowitsch CHKERRQ(VecCopy(y,z)); 1175414bd5c3SStefano Zampini } 11765f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRE_MultKernel_Private(A,1.0,x,1.0,z,PETSC_TRUE)); 1177414bd5c3SStefano Zampini PetscFunctionReturn(0); 1178414bd5c3SStefano Zampini } 1179414bd5c3SStefano Zampini 1180414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */ 118139accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans) 118263c07aadSStefano Zampini { 118363c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 118463c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr; 118563c07aadSStefano Zampini hypre_ParVector *hx,*hy; 118663c07aadSStefano Zampini 118763c07aadSStefano Zampini PetscFunctionBegin; 118863c07aadSStefano Zampini if (trans) { 11895f80ce2aSJacob Faibussowitsch CHKERRQ(VecHYPRE_IJVectorPushVecRead(hA->b,x)); 11905f80ce2aSJacob Faibussowitsch if (b != 0.0) CHKERRQ(VecHYPRE_IJVectorPushVec(hA->x,y)); 11915f80ce2aSJacob Faibussowitsch else CHKERRQ(VecHYPRE_IJVectorPushVecWrite(hA->x,y)); 1192a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJVectorGetObject,hA->b->ij,(void**)&hx); 1193a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJVectorGetObject,hA->x->ij,(void**)&hy); 119463c07aadSStefano Zampini } else { 11955f80ce2aSJacob Faibussowitsch CHKERRQ(VecHYPRE_IJVectorPushVecRead(hA->x,x)); 11965f80ce2aSJacob Faibussowitsch if (b != 0.0) CHKERRQ(VecHYPRE_IJVectorPushVec(hA->b,y)); 11975f80ce2aSJacob Faibussowitsch else CHKERRQ(VecHYPRE_IJVectorPushVecWrite(hA->b,y)); 1198a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJVectorGetObject,hA->x->ij,(void**)&hx); 1199a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJVectorGetObject,hA->b->ij,(void**)&hy); 120063c07aadSStefano Zampini } 1201a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 12026ea7df73SStefano Zampini if (trans) { 1203a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixMatvecT,a,parcsr,hx,b,hy); 12046ea7df73SStefano Zampini } else { 1205a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixMatvec,a,parcsr,hx,b,hy); 12066ea7df73SStefano Zampini } 12075f80ce2aSJacob Faibussowitsch CHKERRQ(VecHYPRE_IJVectorPopVec(hA->x)); 12085f80ce2aSJacob Faibussowitsch CHKERRQ(VecHYPRE_IJVectorPopVec(hA->b)); 120963c07aadSStefano Zampini PetscFunctionReturn(0); 121063c07aadSStefano Zampini } 121163c07aadSStefano Zampini 1212ea9daf28SStefano Zampini static PetscErrorCode MatDestroy_HYPRE(Mat A) 121363c07aadSStefano Zampini { 121463c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 121563c07aadSStefano Zampini 121663c07aadSStefano Zampini PetscFunctionBegin; 12175f80ce2aSJacob Faibussowitsch CHKERRQ(VecHYPRE_IJVectorDestroy(&hA->x)); 12185f80ce2aSJacob Faibussowitsch CHKERRQ(VecHYPRE_IJVectorDestroy(&hA->b)); 1219978814f1SStefano Zampini if (hA->ij) { 1220978814f1SStefano Zampini if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL; 1221a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixDestroy,hA->ij); 1222978814f1SStefano Zampini } 12235f80ce2aSJacob Faibussowitsch if (hA->comm) CHKERRQ(PetscCommRestoreComm(PetscObjectComm((PetscObject)A),&hA->comm)); 1224c69f721fSFande Kong 12255f80ce2aSJacob Faibussowitsch CHKERRQ(MatStashDestroy_Private(&A->stash)); 1226c69f721fSFande Kong 12275f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(hA->array)); 1228c69f721fSFande Kong 12295f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_hypre_aij_C",NULL)); 12305f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_hypre_is_C",NULL)); 12315f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_hypre_C",NULL)); 12325f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_mpiaij_hypre_C",NULL)); 12335f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatHYPRESetPreallocation_C",NULL)); 12345f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatHYPREGetParCSR_C",NULL)); 12355f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(A->data)); 123663c07aadSStefano Zampini PetscFunctionReturn(0); 123763c07aadSStefano Zampini } 123863c07aadSStefano Zampini 1239ea9daf28SStefano Zampini static PetscErrorCode MatSetUp_HYPRE(Mat A) 124063c07aadSStefano Zampini { 12414ec6421dSstefano_zampini PetscFunctionBegin; 12425f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPRESetPreallocation(A,PETSC_DEFAULT,NULL,PETSC_DEFAULT,NULL)); 12434ec6421dSstefano_zampini PetscFunctionReturn(0); 12444ec6421dSstefano_zampini } 12454ec6421dSstefano_zampini 12466ea7df73SStefano Zampini //TODO FIX hypre_CSRMatrixMatvecOutOfPlace 12476ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 12486ea7df73SStefano Zampini static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind) 12496ea7df73SStefano Zampini { 12506ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 12516ea7df73SStefano Zampini HYPRE_MemoryLocation hmem = bind ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE; 12526ea7df73SStefano Zampini 12536ea7df73SStefano Zampini PetscFunctionBegin; 12546ea7df73SStefano Zampini A->boundtocpu = bind; 12556ea7df73SStefano Zampini if (hypre_IJMatrixAssembleFlag(hA->ij) && hmem != hypre_IJMatrixMemoryLocation(hA->ij)) { 12566ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 1257a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 1258a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixMigrate,parcsr, hmem); 12596ea7df73SStefano Zampini } 12605f80ce2aSJacob Faibussowitsch if (hA->x) CHKERRQ(VecHYPRE_IJBindToCPU(hA->x,bind)); 12615f80ce2aSJacob Faibussowitsch if (hA->b) CHKERRQ(VecHYPRE_IJBindToCPU(hA->b,bind)); 12626ea7df73SStefano Zampini PetscFunctionReturn(0); 12636ea7df73SStefano Zampini } 12646ea7df73SStefano Zampini #endif 12656ea7df73SStefano Zampini 12664ec6421dSstefano_zampini static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode) 12674ec6421dSstefano_zampini { 126863c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1269c69f721fSFande Kong PetscMPIInt n; 1270c69f721fSFande Kong PetscInt i,j,rstart,ncols,flg; 1271c69f721fSFande Kong PetscInt *row,*col; 1272c69f721fSFande Kong PetscScalar *val; 127363c07aadSStefano Zampini 127463c07aadSStefano Zampini PetscFunctionBegin; 12752c71b3e2SJacob Faibussowitsch PetscCheckFalse(mode == MAT_FLUSH_ASSEMBLY,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE"); 1276c69f721fSFande Kong 1277c69f721fSFande Kong if (!A->nooffprocentries) { 1278c69f721fSFande Kong while (1) { 12795f80ce2aSJacob Faibussowitsch CHKERRQ(MatStashScatterGetMesg_Private(&A->stash,&n,&row,&col,&val,&flg)); 1280c69f721fSFande Kong if (!flg) break; 1281c69f721fSFande Kong 1282c69f721fSFande Kong for (i=0; i<n;) { 1283c69f721fSFande Kong /* Now identify the consecutive vals belonging to the same row */ 1284c69f721fSFande Kong for (j=i,rstart=row[j]; j<n; j++) { 1285c69f721fSFande Kong if (row[j] != rstart) break; 1286c69f721fSFande Kong } 1287c69f721fSFande Kong if (j < n) ncols = j-i; 1288c69f721fSFande Kong else ncols = n-i; 1289c69f721fSFande Kong /* Now assemble all these values with a single function call */ 12905f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetValues_HYPRE(A,1,row+i,ncols,col+i,val+i,A->insertmode)); 1291c69f721fSFande Kong 1292c69f721fSFande Kong i = j; 1293c69f721fSFande Kong } 1294c69f721fSFande Kong } 12955f80ce2aSJacob Faibussowitsch CHKERRQ(MatStashScatterEnd_Private(&A->stash)); 1296c69f721fSFande Kong } 1297c69f721fSFande Kong 1298a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixAssemble,hA->ij); 1299336664bdSPierre Jolivet /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */ 1300336664bdSPierre Jolivet /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */ 1301336664bdSPierre Jolivet if (!hA->sorted_full) { 1302af1cf968SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1303af1cf968SStefano Zampini 1304af1cf968SStefano Zampini /* call destroy just to make sure we do not leak anything */ 1305af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij); 1306a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_AuxParCSRMatrixDestroy,aux_matrix); 1307af1cf968SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1308af1cf968SStefano Zampini 1309af1cf968SStefano Zampini /* Initialize with assembled flag -> it only recreates the aux_par_matrix */ 1310a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixInitialize,hA->ij); 1311af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij); 13126ea7df73SStefano Zampini if (aux_matrix) { 1313af1cf968SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see comment in MatHYPRESetPreallocation_HYPRE */ 131422235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 1315a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_AuxParCSRMatrixInitialize,aux_matrix); 131622235d61SPierre Jolivet #else 1317a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_AuxParCSRMatrixInitialize_v2,aux_matrix,HYPRE_MEMORY_HOST); 131822235d61SPierre Jolivet #endif 1319af1cf968SStefano Zampini } 13206ea7df73SStefano Zampini } 13216ea7df73SStefano Zampini { 13226ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 13236ea7df73SStefano Zampini 1324a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 1325a74df02fSJacob Faibussowitsch if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscStackCallStandard(hypre_MatvecCommPkgCreate,parcsr); 13266ea7df73SStefano Zampini } 13275f80ce2aSJacob Faibussowitsch if (!hA->x) CHKERRQ(VecHYPRE_IJVectorCreate(A->cmap,&hA->x)); 13285f80ce2aSJacob Faibussowitsch if (!hA->b) CHKERRQ(VecHYPRE_IJVectorCreate(A->rmap,&hA->b)); 13296ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 13305f80ce2aSJacob Faibussowitsch CHKERRQ(MatBindToCPU_HYPRE(A,A->boundtocpu)); 13316ea7df73SStefano Zampini #endif 133263c07aadSStefano Zampini PetscFunctionReturn(0); 133363c07aadSStefano Zampini } 133463c07aadSStefano Zampini 1335c69f721fSFande Kong static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array) 1336c69f721fSFande Kong { 1337c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1338c69f721fSFande Kong 1339c69f721fSFande Kong PetscFunctionBegin; 1340*28b400f6SJacob Faibussowitsch PetscCheck(hA->available,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Temporary space is in use"); 1341c69f721fSFande Kong 134239accc25SStefano Zampini if (hA->size >= size) { 134339accc25SStefano Zampini *array = hA->array; 134439accc25SStefano Zampini } else { 13455f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(hA->array)); 1346c69f721fSFande Kong hA->size = size; 13475f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc(hA->size,&hA->array)); 1348c69f721fSFande Kong *array = hA->array; 1349c69f721fSFande Kong } 1350c69f721fSFande Kong 1351c69f721fSFande Kong hA->available = PETSC_FALSE; 1352c69f721fSFande Kong PetscFunctionReturn(0); 1353c69f721fSFande Kong } 1354c69f721fSFande Kong 1355708542d2SFande Kong static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array) 1356c69f721fSFande Kong { 1357c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1358c69f721fSFande Kong 1359c69f721fSFande Kong PetscFunctionBegin; 1360c69f721fSFande Kong *array = NULL; 1361c69f721fSFande Kong hA->available = PETSC_TRUE; 1362c69f721fSFande Kong PetscFunctionReturn(0); 1363c69f721fSFande Kong } 1364c69f721fSFande Kong 13656ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins) 1366d975228cSstefano_zampini { 1367d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1368d975228cSstefano_zampini PetscScalar *vals = (PetscScalar *)v; 136939accc25SStefano Zampini HYPRE_Complex *sscr; 1370c69f721fSFande Kong PetscInt *cscr[2]; 1371c69f721fSFande Kong PetscInt i,nzc; 137208defe43SFande Kong void *array = NULL; 1373d975228cSstefano_zampini 1374d975228cSstefano_zampini PetscFunctionBegin; 13755f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetArray_HYPRE(A,sizeof(PetscInt)*(2*nc)+sizeof(HYPRE_Complex)*nc*nr,&array)); 1376c69f721fSFande Kong cscr[0] = (PetscInt*)array; 1377c69f721fSFande Kong cscr[1] = ((PetscInt*)array)+nc; 137839accc25SStefano Zampini sscr = (HYPRE_Complex*)(((PetscInt*)array)+nc*2); 1379d975228cSstefano_zampini for (i=0,nzc=0;i<nc;i++) { 1380d975228cSstefano_zampini if (cols[i] >= 0) { 1381d975228cSstefano_zampini cscr[0][nzc ] = cols[i]; 1382d975228cSstefano_zampini cscr[1][nzc++] = i; 1383d975228cSstefano_zampini } 1384d975228cSstefano_zampini } 1385c69f721fSFande Kong if (!nzc) { 13865f80ce2aSJacob Faibussowitsch CHKERRQ(MatRestoreArray_HYPRE(A,&array)); 1387c69f721fSFande Kong PetscFunctionReturn(0); 1388c69f721fSFande Kong } 1389d975228cSstefano_zampini 13906ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE) 13916ea7df73SStefano Zampini if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) { 13926ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 13936ea7df73SStefano Zampini 1394a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)&parcsr); 1395a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixMigrate,parcsr, HYPRE_MEMORY_HOST); 13966ea7df73SStefano Zampini } 13976ea7df73SStefano Zampini #endif 13986ea7df73SStefano Zampini 1399d975228cSstefano_zampini if (ins == ADD_VALUES) { 1400d975228cSstefano_zampini for (i=0;i<nr;i++) { 14016ea7df73SStefano Zampini if (rows[i] >= 0) { 1402d975228cSstefano_zampini PetscInt j; 14032cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 14042cf14000SStefano Zampini 14052c71b3e2SJacob Faibussowitsch PetscCheckFalse((PetscInt)hnc != nzc,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,nzc,rows[i]); 14065f80ce2aSJacob Faibussowitsch for (j=0;j<nzc;j++) CHKERRQ(PetscHYPREScalarCast(vals[cscr[1][j]],&sscr[j])); 1407a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixAddToValues,hA->ij,1,&hnc,(HYPRE_BigInt*)(rows+i),(HYPRE_BigInt*)cscr[0],sscr); 1408d975228cSstefano_zampini } 1409d975228cSstefano_zampini vals += nc; 1410d975228cSstefano_zampini } 1411d975228cSstefano_zampini } else { /* INSERT_VALUES */ 1412d975228cSstefano_zampini PetscInt rst,ren; 1413c69f721fSFande Kong 14145f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetOwnershipRange(A,&rst,&ren)); 1415d975228cSstefano_zampini for (i=0;i<nr;i++) { 14166ea7df73SStefano Zampini if (rows[i] >= 0) { 1417d975228cSstefano_zampini PetscInt j; 14182cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc; 14192cf14000SStefano Zampini 14202c71b3e2SJacob Faibussowitsch PetscCheckFalse((PetscInt)hnc != nzc,PETSC_COMM_SELF,PETSC_ERR_SUP,"Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT,nzc,rows[i]); 14215f80ce2aSJacob Faibussowitsch for (j=0;j<nzc;j++) CHKERRQ(PetscHYPREScalarCast(vals[cscr[1][j]],&sscr[j])); 1422c69f721fSFande Kong /* nonlocal values */ 14235f80ce2aSJacob Faibussowitsch if (rows[i] < rst || rows[i] >= ren) CHKERRQ(MatStashValuesRow_Private(&A->stash,rows[i],nzc,cscr[0],(PetscScalar*)sscr,PETSC_FALSE)); 1424c69f721fSFande Kong /* local values */ 1425a74df02fSJacob Faibussowitsch else PetscStackCallStandard(HYPRE_IJMatrixSetValues,hA->ij,1,&hnc,(HYPRE_BigInt*)(rows+i),(HYPRE_BigInt*)cscr[0],sscr); 1426d975228cSstefano_zampini } 1427d975228cSstefano_zampini vals += nc; 1428d975228cSstefano_zampini } 1429d975228cSstefano_zampini } 1430c69f721fSFande Kong 14315f80ce2aSJacob Faibussowitsch CHKERRQ(MatRestoreArray_HYPRE(A,&array)); 1432d975228cSstefano_zampini PetscFunctionReturn(0); 1433d975228cSstefano_zampini } 1434d975228cSstefano_zampini 1435d975228cSstefano_zampini static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1436d975228cSstefano_zampini { 1437d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 14387d968826Sstefano_zampini HYPRE_Int *hdnnz,*honnz; 143906a29025Sstefano_zampini PetscInt i,rs,re,cs,ce,bs; 1440d975228cSstefano_zampini PetscMPIInt size; 1441d975228cSstefano_zampini 1442d975228cSstefano_zampini PetscFunctionBegin; 14435f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLayoutSetUp(A->rmap)); 14445f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLayoutSetUp(A->cmap)); 1445d975228cSstefano_zampini rs = A->rmap->rstart; 1446d975228cSstefano_zampini re = A->rmap->rend; 1447d975228cSstefano_zampini cs = A->cmap->rstart; 1448d975228cSstefano_zampini ce = A->cmap->rend; 1449d975228cSstefano_zampini if (!hA->ij) { 1450a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixCreate,hA->comm,rs,re-1,cs,ce-1,&hA->ij); 1451a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR); 1452d975228cSstefano_zampini } else { 14532cf14000SStefano Zampini HYPRE_BigInt hrs,hre,hcs,hce; 1454a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetLocalRange,hA->ij,&hrs,&hre,&hcs,&hce); 14552c71b3e2SJacob Faibussowitsch PetscCheckFalse(hre-hrs+1 != re -rs,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Inconsistent local rows: IJMatrix [%" PetscInt_FMT ",%" PetscInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")",hrs,hre+1,rs,re); 14562c71b3e2SJacob Faibussowitsch PetscCheckFalse(hce-hcs+1 != ce -cs,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Inconsistent local cols: IJMatrix [%" PetscInt_FMT ",%" PetscInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")",hcs,hce+1,cs,ce); 1457d975228cSstefano_zampini } 14585f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetBlockSize(A,&bs)); 145906a29025Sstefano_zampini if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10*bs; 146006a29025Sstefano_zampini if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10*bs; 146106a29025Sstefano_zampini 1462d975228cSstefano_zampini if (!dnnz) { 14635f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(A->rmap->n,&hdnnz)); 1464d975228cSstefano_zampini for (i=0;i<A->rmap->n;i++) hdnnz[i] = dnz; 1465d975228cSstefano_zampini } else { 14667d968826Sstefano_zampini hdnnz = (HYPRE_Int*)dnnz; 1467d975228cSstefano_zampini } 14685f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A),&size)); 1469d975228cSstefano_zampini if (size > 1) { 1470ddbeb582SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix; 1471d975228cSstefano_zampini if (!onnz) { 14725f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(A->rmap->n,&honnz)); 1473d975228cSstefano_zampini for (i=0;i<A->rmap->n;i++) honnz[i] = onz; 147422235d61SPierre Jolivet } else honnz = (HYPRE_Int*)onnz; 1475ddbeb582SStefano Zampini /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems 1476ddbeb582SStefano Zampini they assume the user will input the entire row values, properly sorted 1477336664bdSPierre Jolivet In PETSc, we don't make such an assumption and set this flag to 1, 1478336664bdSPierre Jolivet unless the option MAT_SORTED_FULL is set to true. 1479ddbeb582SStefano Zampini Also, to avoid possible memory leaks, we destroy and recreate the translator 1480ddbeb582SStefano Zampini This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize 1481ddbeb582SStefano Zampini the IJ matrix for us */ 1482ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij); 1483ddbeb582SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix); 1484ddbeb582SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL; 1485a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetDiagOffdSizes,hA->ij,hdnnz,honnz); 1486ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix*)hypre_IJMatrixTranslator(hA->ij); 1487336664bdSPierre Jolivet hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !hA->sorted_full; 1488d975228cSstefano_zampini } else { 1489d975228cSstefano_zampini honnz = NULL; 1490a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetRowSizes,hA->ij,hdnnz); 1491d975228cSstefano_zampini } 1492ddbeb582SStefano Zampini 1493af1cf968SStefano Zampini /* reset assembled flag and call the initialize method */ 1494af1cf968SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 0; 14956ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 1496a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixInitialize,hA->ij); 14976ea7df73SStefano Zampini #else 1498a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixInitialize_v2,hA->ij,HYPRE_MEMORY_HOST); 14996ea7df73SStefano Zampini #endif 1500d975228cSstefano_zampini if (!dnnz) { 15015f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(hdnnz)); 1502d975228cSstefano_zampini } 1503d975228cSstefano_zampini if (!onnz && honnz) { 15045f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(honnz)); 1505d975228cSstefano_zampini } 1506af1cf968SStefano Zampini /* Match AIJ logic */ 150706a29025Sstefano_zampini A->preallocated = PETSC_TRUE; 1508af1cf968SStefano Zampini A->assembled = PETSC_FALSE; 1509d975228cSstefano_zampini PetscFunctionReturn(0); 1510d975228cSstefano_zampini } 1511d975228cSstefano_zampini 1512d975228cSstefano_zampini /*@C 1513d975228cSstefano_zampini MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format 1514d975228cSstefano_zampini 1515d975228cSstefano_zampini Collective on Mat 1516d975228cSstefano_zampini 1517d975228cSstefano_zampini Input Parameters: 1518d975228cSstefano_zampini + A - the matrix 1519d975228cSstefano_zampini . dnz - number of nonzeros per row in DIAGONAL portion of local submatrix 1520d975228cSstefano_zampini (same value is used for all local rows) 1521d975228cSstefano_zampini . dnnz - array containing the number of nonzeros in the various rows of the 1522d975228cSstefano_zampini DIAGONAL portion of the local submatrix (possibly different for each row) 1523d975228cSstefano_zampini or NULL (PETSC_NULL_INTEGER in Fortran), if d_nz is used to specify the nonzero structure. 1524d975228cSstefano_zampini The size of this array is equal to the number of local rows, i.e 'm'. 1525d975228cSstefano_zampini For matrices that will be factored, you must leave room for (and set) 1526d975228cSstefano_zampini the diagonal entry even if it is zero. 1527d975228cSstefano_zampini . onz - number of nonzeros per row in the OFF-DIAGONAL portion of local 1528d975228cSstefano_zampini submatrix (same value is used for all local rows). 1529d975228cSstefano_zampini - onnz - array containing the number of nonzeros in the various rows of the 1530d975228cSstefano_zampini OFF-DIAGONAL portion of the local submatrix (possibly different for 1531d975228cSstefano_zampini each row) or NULL (PETSC_NULL_INTEGER in Fortran), if o_nz is used to specify the nonzero 1532d975228cSstefano_zampini structure. The size of this array is equal to the number 1533d975228cSstefano_zampini of local rows, i.e 'm'. 1534d975228cSstefano_zampini 153595452b02SPatrick Sanan Notes: 153695452b02SPatrick Sanan If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, onz and onnz are ignored. 1537d975228cSstefano_zampini 1538d975228cSstefano_zampini Level: intermediate 1539d975228cSstefano_zampini 1540af1cf968SStefano Zampini .seealso: MatCreate(), MatMPIAIJSetPreallocation(), MATHYPRE 1541d975228cSstefano_zampini @*/ 1542d975228cSstefano_zampini PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[]) 1543d975228cSstefano_zampini { 1544d975228cSstefano_zampini PetscFunctionBegin; 1545d975228cSstefano_zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1546d975228cSstefano_zampini PetscValidType(A,1); 15475f80ce2aSJacob Faibussowitsch CHKERRQ(PetscTryMethod(A,"MatHYPRESetPreallocation_C",(Mat,PetscInt,const PetscInt[],PetscInt,const PetscInt[]),(A,dnz,dnnz,onz,onnz))); 1548d975228cSstefano_zampini PetscFunctionReturn(0); 1549d975228cSstefano_zampini } 1550d975228cSstefano_zampini 1551225daaf8SStefano Zampini /* 1552225daaf8SStefano Zampini MatCreateFromParCSR - Creates a matrix from a hypre_ParCSRMatrix 1553225daaf8SStefano Zampini 1554225daaf8SStefano Zampini Collective 1555225daaf8SStefano Zampini 1556225daaf8SStefano Zampini Input Parameters: 155745b8d346SStefano Zampini + parcsr - the pointer to the hypre_ParCSRMatrix 1558bb4689ddSStefano Zampini . mtype - matrix type to be created. Currently MATAIJ, MATIS and MATHYPRE are supported. 1559225daaf8SStefano Zampini - copymode - PETSc copying options 1560225daaf8SStefano Zampini 1561225daaf8SStefano Zampini Output Parameter: 1562225daaf8SStefano Zampini . A - the matrix 1563225daaf8SStefano Zampini 1564225daaf8SStefano Zampini Level: intermediate 1565225daaf8SStefano Zampini 1566225daaf8SStefano Zampini .seealso: MatHYPRE, PetscCopyMode 1567225daaf8SStefano Zampini */ 156845b8d346SStefano Zampini PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat* A) 1569978814f1SStefano Zampini { 1570225daaf8SStefano Zampini Mat T; 1571978814f1SStefano Zampini Mat_HYPRE *hA; 1572978814f1SStefano Zampini MPI_Comm comm; 1573978814f1SStefano Zampini PetscInt rstart,rend,cstart,cend,M,N; 1574d248a85cSRichard Tran Mills PetscBool isseqaij,isseqaijmkl,ismpiaij,isaij,ishyp,isis; 1575978814f1SStefano Zampini 1576978814f1SStefano Zampini PetscFunctionBegin; 1577978814f1SStefano Zampini comm = hypre_ParCSRMatrixComm(parcsr); 15785f80ce2aSJacob Faibussowitsch CHKERRQ(PetscStrcmp(mtype,MATSEQAIJ,&isseqaij)); 15795f80ce2aSJacob Faibussowitsch CHKERRQ(PetscStrcmp(mtype,MATSEQAIJMKL,&isseqaijmkl)); 15805f80ce2aSJacob Faibussowitsch CHKERRQ(PetscStrcmp(mtype,MATMPIAIJ,&ismpiaij)); 15815f80ce2aSJacob Faibussowitsch CHKERRQ(PetscStrcmp(mtype,MATAIJ,&isaij)); 15825f80ce2aSJacob Faibussowitsch CHKERRQ(PetscStrcmp(mtype,MATHYPRE,&ishyp)); 15835f80ce2aSJacob Faibussowitsch CHKERRQ(PetscStrcmp(mtype,MATIS,&isis)); 1584d248a85cSRichard Tran Mills isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij); 15856ea7df73SStefano Zampini /* TODO */ 15862c71b3e2SJacob Faibussowitsch PetscCheckFalse(!isaij && !ishyp && !isis,comm,PETSC_ERR_SUP,"Unsupported MatType %s! Supported types are %s, %s, %s, %s, %s, and %s",mtype,MATAIJ,MATSEQAIJ,MATSEQAIJMKL,MATMPIAIJ,MATIS,MATHYPRE); 1587978814f1SStefano Zampini /* access ParCSRMatrix */ 1588978814f1SStefano Zampini rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr); 1589978814f1SStefano Zampini rend = hypre_ParCSRMatrixLastRowIndex(parcsr); 1590978814f1SStefano Zampini cstart = hypre_ParCSRMatrixFirstColDiag(parcsr); 1591978814f1SStefano Zampini cend = hypre_ParCSRMatrixLastColDiag(parcsr); 1592978814f1SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(parcsr); 1593978814f1SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(parcsr); 1594978814f1SStefano Zampini 1595fa92c42cSstefano_zampini /* fix for empty local rows/columns */ 1596fa92c42cSstefano_zampini if (rend < rstart) rend = rstart; 1597fa92c42cSstefano_zampini if (cend < cstart) cend = cstart; 1598fa92c42cSstefano_zampini 1599e6471dc9SStefano Zampini /* PETSc convention */ 1600e6471dc9SStefano Zampini rend++; 1601e6471dc9SStefano Zampini cend++; 1602e6471dc9SStefano Zampini rend = PetscMin(rend,M); 1603e6471dc9SStefano Zampini cend = PetscMin(cend,N); 1604e6471dc9SStefano Zampini 1605978814f1SStefano Zampini /* create PETSc matrix with MatHYPRE */ 16065f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreate(comm,&T)); 16075f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetSizes(T,rend-rstart,cend-cstart,M,N)); 16085f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(T,MATHYPRE)); 1609225daaf8SStefano Zampini hA = (Mat_HYPRE*)(T->data); 1610978814f1SStefano Zampini 1611978814f1SStefano Zampini /* create HYPRE_IJMatrix */ 1612a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixCreate,hA->comm,rstart,rend-1,cstart,cend-1,&hA->ij); 1613a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetObjectType,hA->ij,HYPRE_PARCSR); 161445b8d346SStefano Zampini 16156ea7df73SStefano Zampini // TODO DEV 161645b8d346SStefano Zampini /* create new ParCSR object if needed */ 161745b8d346SStefano Zampini if (ishyp && copymode == PETSC_COPY_VALUES) { 161845b8d346SStefano Zampini hypre_ParCSRMatrix *new_parcsr; 16196ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,18,0) 162045b8d346SStefano Zampini hypre_CSRMatrix *hdiag,*hoffd,*ndiag,*noffd; 162145b8d346SStefano Zampini 16220e6427aaSSatish Balay new_parcsr = hypre_ParCSRMatrixClone(parcsr,0); 162345b8d346SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr); 162445b8d346SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr); 162545b8d346SStefano Zampini ndiag = hypre_ParCSRMatrixDiag(new_parcsr); 162645b8d346SStefano Zampini noffd = hypre_ParCSRMatrixOffd(new_parcsr); 16275f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hypre_CSRMatrixData(ndiag),hypre_CSRMatrixData(hdiag),hypre_CSRMatrixNumNonzeros(hdiag))); 16285f80ce2aSJacob Faibussowitsch CHKERRQ(PetscArraycpy(hypre_CSRMatrixData(noffd),hypre_CSRMatrixData(hoffd),hypre_CSRMatrixNumNonzeros(hoffd))); 16296ea7df73SStefano Zampini #else 16306ea7df73SStefano Zampini new_parcsr = hypre_ParCSRMatrixClone(parcsr,1); 16316ea7df73SStefano Zampini #endif 163245b8d346SStefano Zampini parcsr = new_parcsr; 163345b8d346SStefano Zampini copymode = PETSC_OWN_POINTER; 163445b8d346SStefano Zampini } 1635978814f1SStefano Zampini 1636978814f1SStefano Zampini /* set ParCSR object */ 1637978814f1SStefano Zampini hypre_IJMatrixObject(hA->ij) = parcsr; 16384ec6421dSstefano_zampini T->preallocated = PETSC_TRUE; 1639978814f1SStefano Zampini 1640978814f1SStefano Zampini /* set assembled flag */ 1641978814f1SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 1; 16426ea7df73SStefano Zampini #if 0 1643a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixInitialize,hA->ij); 16446ea7df73SStefano Zampini #endif 1645225daaf8SStefano Zampini if (ishyp) { 16466d2a658fSstefano_zampini PetscMPIInt myid = 0; 16476d2a658fSstefano_zampini 16486d2a658fSstefano_zampini /* make sure we always have row_starts and col_starts available */ 16496d2a658fSstefano_zampini if (HYPRE_AssumedPartitionCheck()) { 16505f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_rank(comm,&myid)); 16516d2a658fSstefano_zampini } 1652a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts) 16536d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) { 16546d2a658fSstefano_zampini PetscLayout map; 16556d2a658fSstefano_zampini 16565f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetLayouts(T,NULL,&map)); 16575f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLayoutSetUp(map)); 16582cf14000SStefano Zampini hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt*)(map->range + myid); 16596d2a658fSstefano_zampini } 16606d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) { 16616d2a658fSstefano_zampini PetscLayout map; 16626d2a658fSstefano_zampini 16635f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetLayouts(T,&map,NULL)); 16645f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLayoutSetUp(map)); 16652cf14000SStefano Zampini hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt*)(map->range + myid); 16666d2a658fSstefano_zampini } 1667a1d2239cSSatish Balay #endif 1668978814f1SStefano Zampini /* prevent from freeing the pointer */ 1669978814f1SStefano Zampini if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE; 1670225daaf8SStefano Zampini *A = T; 16715f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetOption(*A,MAT_SORTED_FULL,PETSC_TRUE)); 16725f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyBegin(*A,MAT_FINAL_ASSEMBLY)); 16735f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyEnd(*A,MAT_FINAL_ASSEMBLY)); 1674bb4689ddSStefano Zampini } else if (isaij) { 1675bb4689ddSStefano Zampini if (copymode != PETSC_OWN_POINTER) { 1676225daaf8SStefano Zampini /* prevent from freeing the pointer */ 1677225daaf8SStefano Zampini hA->inner_free = PETSC_FALSE; 16785f80ce2aSJacob Faibussowitsch CHKERRQ(MatConvert_HYPRE_AIJ(T,MATAIJ,MAT_INITIAL_MATRIX,A)); 16795f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&T)); 1680225daaf8SStefano Zampini } else { /* AIJ return type with PETSC_OWN_POINTER */ 16815f80ce2aSJacob Faibussowitsch CHKERRQ(MatConvert_HYPRE_AIJ(T,MATAIJ,MAT_INPLACE_MATRIX,&T)); 1682225daaf8SStefano Zampini *A = T; 1683225daaf8SStefano Zampini } 1684bb4689ddSStefano Zampini } else if (isis) { 16855f80ce2aSJacob Faibussowitsch CHKERRQ(MatConvert_HYPRE_IS(T,MATIS,MAT_INITIAL_MATRIX,A)); 16868cfe8d00SStefano Zampini if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE; 16875f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&T)); 1688bb4689ddSStefano Zampini } 1689978814f1SStefano Zampini PetscFunctionReturn(0); 1690978814f1SStefano Zampini } 1691978814f1SStefano Zampini 169268ec7858SStefano Zampini static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr) 1693dd9c0a25Sstefano_zampini { 1694dd9c0a25Sstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1695dd9c0a25Sstefano_zampini HYPRE_Int type; 1696dd9c0a25Sstefano_zampini 1697dd9c0a25Sstefano_zampini PetscFunctionBegin; 1698*28b400f6SJacob Faibussowitsch PetscCheck(hA->ij,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"HYPRE_IJMatrix not present"); 1699a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObjectType,hA->ij,&type); 17002c71b3e2SJacob Faibussowitsch PetscCheckFalse(type != HYPRE_PARCSR,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"HYPRE_IJMatrix is not of type HYPRE_PARCSR"); 1701a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetObject,hA->ij,(void**)parcsr); 1702dd9c0a25Sstefano_zampini PetscFunctionReturn(0); 1703dd9c0a25Sstefano_zampini } 1704dd9c0a25Sstefano_zampini 1705dd9c0a25Sstefano_zampini /* 1706dd9c0a25Sstefano_zampini MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix 1707dd9c0a25Sstefano_zampini 1708dd9c0a25Sstefano_zampini Not collective 1709dd9c0a25Sstefano_zampini 1710dd9c0a25Sstefano_zampini Input Parameters: 1711dd9c0a25Sstefano_zampini + A - the MATHYPRE object 1712dd9c0a25Sstefano_zampini 1713dd9c0a25Sstefano_zampini Output Parameter: 1714dd9c0a25Sstefano_zampini . parcsr - the pointer to the hypre_ParCSRMatrix 1715dd9c0a25Sstefano_zampini 1716dd9c0a25Sstefano_zampini Level: intermediate 1717dd9c0a25Sstefano_zampini 1718dd9c0a25Sstefano_zampini .seealso: MatHYPRE, PetscCopyMode 1719dd9c0a25Sstefano_zampini */ 1720dd9c0a25Sstefano_zampini PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr) 1721dd9c0a25Sstefano_zampini { 1722dd9c0a25Sstefano_zampini PetscFunctionBegin; 1723dd9c0a25Sstefano_zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1724dd9c0a25Sstefano_zampini PetscValidType(A,1); 17255f80ce2aSJacob Faibussowitsch CHKERRQ(PetscUseMethod(A,"MatHYPREGetParCSR_C",(Mat,hypre_ParCSRMatrix**),(A,parcsr))); 1726dd9c0a25Sstefano_zampini PetscFunctionReturn(0); 1727dd9c0a25Sstefano_zampini } 1728dd9c0a25Sstefano_zampini 172968ec7858SStefano Zampini static PetscErrorCode MatMissingDiagonal_HYPRE(Mat A, PetscBool *missing, PetscInt *dd) 173068ec7858SStefano Zampini { 173168ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 173268ec7858SStefano Zampini hypre_CSRMatrix *ha; 173368ec7858SStefano Zampini PetscInt rst; 173468ec7858SStefano Zampini 173568ec7858SStefano Zampini PetscFunctionBegin; 17362c71b3e2SJacob Faibussowitsch PetscCheckFalse(A->rmap->n != A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented with non-square diagonal blocks"); 17375f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetOwnershipRange(A,&rst,NULL)); 17385f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 173968ec7858SStefano Zampini if (missing) *missing = PETSC_FALSE; 174068ec7858SStefano Zampini if (dd) *dd = -1; 174168ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 174268ec7858SStefano Zampini if (ha) { 174368299464SStefano Zampini PetscInt size,i; 174468299464SStefano Zampini HYPRE_Int *ii,*jj; 174568ec7858SStefano Zampini 174668ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 174768ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 174868ec7858SStefano Zampini jj = hypre_CSRMatrixJ(ha); 174968ec7858SStefano Zampini for (i = 0; i < size; i++) { 175068ec7858SStefano Zampini PetscInt j; 175168ec7858SStefano Zampini PetscBool found = PETSC_FALSE; 175268ec7858SStefano Zampini 175368ec7858SStefano Zampini for (j = ii[i]; j < ii[i+1] && !found; j++) 175468ec7858SStefano Zampini found = (jj[j] == i) ? PETSC_TRUE : PETSC_FALSE; 175568ec7858SStefano Zampini 175668ec7858SStefano Zampini if (!found) { 17577d3de750SJacob Faibussowitsch PetscInfo(A,"Matrix is missing local diagonal entry %" PetscInt_FMT "\n",i); 175868ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 175968ec7858SStefano Zampini if (dd) *dd = i+rst; 176068ec7858SStefano Zampini PetscFunctionReturn(0); 176168ec7858SStefano Zampini } 176268ec7858SStefano Zampini } 176368ec7858SStefano Zampini if (!size) { 176468ec7858SStefano Zampini PetscInfo(A,"Matrix has no diagonal entries therefore is missing diagonal\n"); 176568ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 176668ec7858SStefano Zampini if (dd) *dd = rst; 176768ec7858SStefano Zampini } 176868ec7858SStefano Zampini } else { 176968ec7858SStefano Zampini PetscInfo(A,"Matrix has no diagonal entries therefore is missing diagonal\n"); 177068ec7858SStefano Zampini if (missing) *missing = PETSC_TRUE; 177168ec7858SStefano Zampini if (dd) *dd = rst; 177268ec7858SStefano Zampini } 177368ec7858SStefano Zampini PetscFunctionReturn(0); 177468ec7858SStefano Zampini } 177568ec7858SStefano Zampini 177668ec7858SStefano Zampini static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s) 177768ec7858SStefano Zampini { 177868ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 17796ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2,19,0) 178068ec7858SStefano Zampini hypre_CSRMatrix *ha; 17816ea7df73SStefano Zampini #endif 178239accc25SStefano Zampini HYPRE_Complex hs; 178368ec7858SStefano Zampini 178468ec7858SStefano Zampini PetscFunctionBegin; 17855f80ce2aSJacob Faibussowitsch CHKERRQ(PetscHYPREScalarCast(s,&hs)); 17865f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 17876ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2,19,0) 1788a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixScale,parcsr,hs); 17896ea7df73SStefano Zampini #else /* diagonal part */ 179068ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr); 179168ec7858SStefano Zampini if (ha) { 179268299464SStefano Zampini PetscInt size,i; 179368299464SStefano Zampini HYPRE_Int *ii; 179439accc25SStefano Zampini HYPRE_Complex *a; 179568ec7858SStefano Zampini 179668ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 179768ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 179868ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 179939accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 180068ec7858SStefano Zampini } 180168ec7858SStefano Zampini /* offdiagonal part */ 180268ec7858SStefano Zampini ha = hypre_ParCSRMatrixOffd(parcsr); 180368ec7858SStefano Zampini if (ha) { 180468299464SStefano Zampini PetscInt size,i; 180568299464SStefano Zampini HYPRE_Int *ii; 180639accc25SStefano Zampini HYPRE_Complex *a; 180768ec7858SStefano Zampini 180868ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha); 180968ec7858SStefano Zampini a = hypre_CSRMatrixData(ha); 181068ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha); 181139accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs; 181268ec7858SStefano Zampini } 18136ea7df73SStefano Zampini #endif 181468ec7858SStefano Zampini PetscFunctionReturn(0); 181568ec7858SStefano Zampini } 181668ec7858SStefano Zampini 181768ec7858SStefano Zampini static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 181868ec7858SStefano Zampini { 181968ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr; 182068299464SStefano Zampini HYPRE_Int *lrows; 182168299464SStefano Zampini PetscInt rst,ren,i; 182268ec7858SStefano Zampini 182368ec7858SStefano Zampini PetscFunctionBegin; 18242c71b3e2SJacob Faibussowitsch PetscCheckFalse(x || b,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"To be implemented"); 18255f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 18265f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(numRows,&lrows)); 18275f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetOwnershipRange(A,&rst,&ren)); 182868ec7858SStefano Zampini for (i=0;i<numRows;i++) { 182968ec7858SStefano Zampini if (rows[i] < rst || rows[i] >= ren) 183068ec7858SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Non-local rows not yet supported"); 183168ec7858SStefano Zampini lrows[i] = rows[i] - rst; 183268ec7858SStefano Zampini } 1833a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixEliminateRowsCols,parcsr,numRows,lrows); 18345f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(lrows)); 183568ec7858SStefano Zampini PetscFunctionReturn(0); 183668ec7858SStefano Zampini } 183768ec7858SStefano Zampini 1838c69f721fSFande Kong static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha) 1839c69f721fSFande Kong { 1840c69f721fSFande Kong PetscFunctionBegin; 1841c69f721fSFande Kong if (ha) { 1842c69f721fSFande Kong HYPRE_Int *ii, size; 1843c69f721fSFande Kong HYPRE_Complex *a; 1844c69f721fSFande Kong 1845c69f721fSFande Kong size = hypre_CSRMatrixNumRows(ha); 1846c69f721fSFande Kong a = hypre_CSRMatrixData(ha); 1847c69f721fSFande Kong ii = hypre_CSRMatrixI(ha); 1848c69f721fSFande Kong 18495f80ce2aSJacob Faibussowitsch if (a) CHKERRQ(PetscArrayzero(a,ii[size])); 1850c69f721fSFande Kong } 1851c69f721fSFande Kong PetscFunctionReturn(0); 1852c69f721fSFande Kong } 1853c69f721fSFande Kong 1854c69f721fSFande Kong PetscErrorCode MatZeroEntries_HYPRE(Mat A) 1855c69f721fSFande Kong { 18566ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 18576ea7df73SStefano Zampini 18586ea7df73SStefano Zampini PetscFunctionBegin; 18596ea7df73SStefano Zampini if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) { 1860a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetConstantValues,hA->ij,0.0); 18616ea7df73SStefano Zampini } else { 1862c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 1863c69f721fSFande Kong 18645f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 18655f80ce2aSJacob Faibussowitsch CHKERRQ(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr))); 18665f80ce2aSJacob Faibussowitsch CHKERRQ(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr))); 18676ea7df73SStefano Zampini } 1868c69f721fSFande Kong PetscFunctionReturn(0); 1869c69f721fSFande Kong } 1870c69f721fSFande Kong 187139accc25SStefano Zampini static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA,PetscInt N,const PetscInt rows[],HYPRE_Complex diag) 1872c69f721fSFande Kong { 187339accc25SStefano Zampini PetscInt ii; 187439accc25SStefano Zampini HYPRE_Int *i, *j; 187539accc25SStefano Zampini HYPRE_Complex *a; 1876c69f721fSFande Kong 1877c69f721fSFande Kong PetscFunctionBegin; 1878c69f721fSFande Kong if (!hA) PetscFunctionReturn(0); 1879c69f721fSFande Kong 188039accc25SStefano Zampini i = hypre_CSRMatrixI(hA); 188139accc25SStefano Zampini j = hypre_CSRMatrixJ(hA); 1882c69f721fSFande Kong a = hypre_CSRMatrixData(hA); 1883c69f721fSFande Kong 1884c69f721fSFande Kong for (ii = 0; ii < N; ii++) { 188539accc25SStefano Zampini HYPRE_Int jj, ibeg, iend, irow; 188639accc25SStefano Zampini 1887c69f721fSFande Kong irow = rows[ii]; 1888c69f721fSFande Kong ibeg = i[irow]; 1889c69f721fSFande Kong iend = i[irow+1]; 1890c69f721fSFande Kong for (jj = ibeg; jj < iend; jj++) 1891c69f721fSFande Kong if (j[jj] == irow) a[jj] = diag; 1892c69f721fSFande Kong else a[jj] = 0.0; 1893c69f721fSFande Kong } 1894c69f721fSFande Kong PetscFunctionReturn(0); 1895c69f721fSFande Kong } 1896c69f721fSFande Kong 1897ddbeb582SStefano Zampini static PetscErrorCode MatZeroRows_HYPRE(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 1898c69f721fSFande Kong { 1899c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 1900c69f721fSFande Kong PetscInt *lrows,len; 190139accc25SStefano Zampini HYPRE_Complex hdiag; 1902c69f721fSFande Kong 1903c69f721fSFande Kong PetscFunctionBegin; 19042c71b3e2SJacob Faibussowitsch PetscCheckFalse(x || b,PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size"); 19055f80ce2aSJacob Faibussowitsch CHKERRQ(PetscHYPREScalarCast(diag,&hdiag)); 1906c69f721fSFande Kong /* retrieve the internal matrix */ 19075f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 1908c69f721fSFande Kong /* get locally owned rows */ 19095f80ce2aSJacob Faibussowitsch CHKERRQ(MatZeroRowsMapLocal_Private(A,N,rows,&len,&lrows)); 1910c69f721fSFande Kong /* zero diagonal part */ 19115f80ce2aSJacob Faibussowitsch CHKERRQ(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr),len,lrows,hdiag)); 1912c69f721fSFande Kong /* zero off-diagonal part */ 19135f80ce2aSJacob Faibussowitsch CHKERRQ(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr),len,lrows,0.0)); 1914c69f721fSFande Kong 19155f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(lrows)); 1916c69f721fSFande Kong PetscFunctionReturn(0); 1917c69f721fSFande Kong } 1918c69f721fSFande Kong 1919ddbeb582SStefano Zampini static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat,MatAssemblyType mode) 1920c69f721fSFande Kong { 1921c69f721fSFande Kong PetscFunctionBegin; 1922c69f721fSFande Kong if (mat->nooffprocentries) PetscFunctionReturn(0); 1923c69f721fSFande Kong 19245f80ce2aSJacob Faibussowitsch CHKERRQ(MatStashScatterBegin_Private(mat,&mat->stash,mat->rmap->range)); 1925c69f721fSFande Kong PetscFunctionReturn(0); 1926c69f721fSFande Kong } 1927c69f721fSFande Kong 1928ddbeb582SStefano Zampini static PetscErrorCode MatGetRow_HYPRE(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 1929c69f721fSFande Kong { 1930c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 19312cf14000SStefano Zampini HYPRE_Int hnz; 1932c69f721fSFande Kong 1933c69f721fSFande Kong PetscFunctionBegin; 1934c69f721fSFande Kong /* retrieve the internal matrix */ 19355f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 1936c69f721fSFande Kong /* call HYPRE API */ 1937a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_ParCSRMatrixGetRow,parcsr,row,&hnz,(HYPRE_BigInt**)idx,(HYPRE_Complex**)v); 19382cf14000SStefano Zampini if (nz) *nz = (PetscInt)hnz; 1939c69f721fSFande Kong PetscFunctionReturn(0); 1940c69f721fSFande Kong } 1941c69f721fSFande Kong 1942ddbeb582SStefano Zampini static PetscErrorCode MatRestoreRow_HYPRE(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 1943c69f721fSFande Kong { 1944c69f721fSFande Kong hypre_ParCSRMatrix *parcsr; 19452cf14000SStefano Zampini HYPRE_Int hnz; 1946c69f721fSFande Kong 1947c69f721fSFande Kong PetscFunctionBegin; 1948c69f721fSFande Kong /* retrieve the internal matrix */ 19495f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 1950c69f721fSFande Kong /* call HYPRE API */ 19512cf14000SStefano Zampini hnz = nz ? (HYPRE_Int)(*nz) : 0; 1952a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_ParCSRMatrixRestoreRow,parcsr,row,&hnz,(HYPRE_BigInt**)idx,(HYPRE_Complex**)v); 1953c69f721fSFande Kong PetscFunctionReturn(0); 1954c69f721fSFande Kong } 1955c69f721fSFande Kong 1956ddbeb582SStefano Zampini static PetscErrorCode MatGetValues_HYPRE(Mat A,PetscInt m,const PetscInt idxm[],PetscInt n,const PetscInt idxn[],PetscScalar v[]) 1957c69f721fSFande Kong { 195845b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1959c69f721fSFande Kong PetscInt i; 19601d4906efSStefano Zampini 1961c69f721fSFande Kong PetscFunctionBegin; 1962c69f721fSFande Kong if (!m || !n) PetscFunctionReturn(0); 1963c69f721fSFande Kong /* Ignore negative row indices 1964c69f721fSFande Kong * And negative column indices should be automatically ignored in hypre 1965c69f721fSFande Kong * */ 19662cf14000SStefano Zampini for (i=0; i<m; i++) { 19672cf14000SStefano Zampini if (idxm[i] >= 0) { 19682cf14000SStefano Zampini HYPRE_Int hn = (HYPRE_Int)n; 1969a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixGetValues,hA->ij,1,&hn,(HYPRE_BigInt*)&idxm[i],(HYPRE_BigInt*)idxn,(HYPRE_Complex*)(v + i*n)); 19702cf14000SStefano Zampini } 19712cf14000SStefano Zampini } 1972c69f721fSFande Kong PetscFunctionReturn(0); 1973c69f721fSFande Kong } 1974c69f721fSFande Kong 1975ddbeb582SStefano Zampini static PetscErrorCode MatSetOption_HYPRE(Mat A,MatOption op,PetscBool flg) 1976ddbeb582SStefano Zampini { 1977ddbeb582SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 1978ddbeb582SStefano Zampini 1979ddbeb582SStefano Zampini PetscFunctionBegin; 1980c6698e78SStefano Zampini switch (op) { 1981ddbeb582SStefano Zampini case MAT_NO_OFF_PROC_ENTRIES: 1982ddbeb582SStefano Zampini if (flg) { 1983a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixSetMaxOffProcElmts,hA->ij,0); 1984ddbeb582SStefano Zampini } 1985ddbeb582SStefano Zampini break; 1986336664bdSPierre Jolivet case MAT_SORTED_FULL: 1987336664bdSPierre Jolivet hA->sorted_full = flg; 1988336664bdSPierre Jolivet break; 1989ddbeb582SStefano Zampini default: 1990ddbeb582SStefano Zampini break; 1991ddbeb582SStefano Zampini } 1992ddbeb582SStefano Zampini PetscFunctionReturn(0); 1993ddbeb582SStefano Zampini } 1994c69f721fSFande Kong 199545b8d346SStefano Zampini static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view) 199645b8d346SStefano Zampini { 199745b8d346SStefano Zampini PetscViewerFormat format; 199845b8d346SStefano Zampini 199945b8d346SStefano Zampini PetscFunctionBegin; 20005f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerGetFormat(view,&format)); 20016ea7df73SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 200245b8d346SStefano Zampini if (format != PETSC_VIEWER_NATIVE) { 20036ea7df73SStefano Zampini Mat B; 20046ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr; 20056ea7df73SStefano Zampini PetscErrorCode (*mview)(Mat,PetscViewer) = NULL; 20066ea7df73SStefano Zampini 20075f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 20085f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(parcsr,MATAIJ,PETSC_USE_POINTER,&B)); 20095f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetOperation(B,MATOP_VIEW,(void(**)(void))&mview)); 2010*28b400f6SJacob Faibussowitsch PetscCheck(mview,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing view operation"); 20115f80ce2aSJacob Faibussowitsch CHKERRQ((*mview)(B,view)); 20125f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&B)); 201345b8d346SStefano Zampini } else { 201445b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE*)A->data; 201545b8d346SStefano Zampini PetscMPIInt size; 201645b8d346SStefano Zampini PetscBool isascii; 201745b8d346SStefano Zampini const char *filename; 201845b8d346SStefano Zampini 201945b8d346SStefano Zampini /* HYPRE uses only text files */ 20205f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectTypeCompare((PetscObject)view,PETSCVIEWERASCII,&isascii)); 2021*28b400f6SJacob Faibussowitsch PetscCheck(isascii,PetscObjectComm((PetscObject)view),PETSC_ERR_SUP,"PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII",((PetscObject)view)->type_name); 20225f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerFileGetName(view,&filename)); 2023a74df02fSJacob Faibussowitsch PetscStackCallStandard(HYPRE_IJMatrixPrint,hA->ij,filename); 20245f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_size(hA->comm,&size)); 202545b8d346SStefano Zampini if (size > 1) { 20265f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(view,"Matrix files: %s.%05d ... %s.%05d\n",filename,0,filename,size-1)); 202745b8d346SStefano Zampini } else { 20285f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(view,"Matrix file: %s.%05d\n",filename,0)); 202945b8d346SStefano Zampini } 203045b8d346SStefano Zampini } 203145b8d346SStefano Zampini PetscFunctionReturn(0); 203245b8d346SStefano Zampini } 203345b8d346SStefano Zampini 203445b8d346SStefano Zampini static PetscErrorCode MatDuplicate_HYPRE(Mat A,MatDuplicateOption op, Mat *B) 203545b8d346SStefano Zampini { 20366abb4441SStefano Zampini hypre_ParCSRMatrix *parcsr = NULL; 203745b8d346SStefano Zampini PetscCopyMode cpmode; 203845b8d346SStefano Zampini 203945b8d346SStefano Zampini PetscFunctionBegin; 20405f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 204145b8d346SStefano Zampini if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) { 20420e6427aaSSatish Balay parcsr = hypre_ParCSRMatrixClone(parcsr,0); 204345b8d346SStefano Zampini cpmode = PETSC_OWN_POINTER; 204445b8d346SStefano Zampini } else { 204545b8d346SStefano Zampini cpmode = PETSC_COPY_VALUES; 204645b8d346SStefano Zampini } 20475f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(parcsr,MATHYPRE,cpmode,B)); 204845b8d346SStefano Zampini PetscFunctionReturn(0); 204945b8d346SStefano Zampini } 205045b8d346SStefano Zampini 2051465edc17SStefano Zampini static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str) 2052465edc17SStefano Zampini { 2053465edc17SStefano Zampini hypre_ParCSRMatrix *acsr,*bcsr; 2054465edc17SStefano Zampini 2055465edc17SStefano Zampini PetscFunctionBegin; 2056465edc17SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 20575f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&acsr)); 20585f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(B,&bcsr)); 2059a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixCopy,acsr,bcsr,1); 20605f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetOption(B,MAT_SORTED_FULL,PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */ 20615f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY)); 20625f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY)); 2063465edc17SStefano Zampini } else { 20645f80ce2aSJacob Faibussowitsch CHKERRQ(MatCopy_Basic(A,B,str)); 2065465edc17SStefano Zampini } 2066465edc17SStefano Zampini PetscFunctionReturn(0); 2067465edc17SStefano Zampini } 2068465edc17SStefano Zampini 20696305df00SStefano Zampini static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d) 20706305df00SStefano Zampini { 20716305df00SStefano Zampini hypre_ParCSRMatrix *parcsr; 20726305df00SStefano Zampini hypre_CSRMatrix *dmat; 207339accc25SStefano Zampini HYPRE_Complex *a; 207439accc25SStefano Zampini HYPRE_Complex *data = NULL; 20752cf14000SStefano Zampini HYPRE_Int *diag = NULL; 20762cf14000SStefano Zampini PetscInt i; 20776305df00SStefano Zampini PetscBool cong; 20786305df00SStefano Zampini 20796305df00SStefano Zampini PetscFunctionBegin; 20805f80ce2aSJacob Faibussowitsch CHKERRQ(MatHasCongruentLayouts(A,&cong)); 2081*28b400f6SJacob Faibussowitsch PetscCheck(cong,PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Only for square matrices with same local distributions of rows and columns"); 208276bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 20836305df00SStefano Zampini PetscBool miss; 20845f80ce2aSJacob Faibussowitsch CHKERRQ(MatMissingDiagonal(A,&miss,NULL)); 20852c71b3e2SJacob Faibussowitsch PetscCheckFalse(miss && A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented when diagonal entries are missing"); 20866305df00SStefano Zampini } 20875f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR_HYPRE(A,&parcsr)); 20886305df00SStefano Zampini dmat = hypre_ParCSRMatrixDiag(parcsr); 20896305df00SStefano Zampini if (dmat) { 209039accc25SStefano Zampini /* this cast fixes the clang error: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */ 20915f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(d,(PetscScalar**)&a)); 20922cf14000SStefano Zampini diag = hypre_CSRMatrixI(dmat); 209339accc25SStefano Zampini data = hypre_CSRMatrixData(dmat); 20946305df00SStefano Zampini for (i=0;i<A->rmap->n;i++) a[i] = data[diag[i]]; 20955f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(d,(PetscScalar**)&a)); 20966305df00SStefano Zampini } 20976305df00SStefano Zampini PetscFunctionReturn(0); 20986305df00SStefano Zampini } 20996305df00SStefano Zampini 2100363d496dSStefano Zampini #include <petscblaslapack.h> 2101363d496dSStefano Zampini 2102363d496dSStefano Zampini static PetscErrorCode MatAXPY_HYPRE(Mat Y,PetscScalar a,Mat X,MatStructure str) 2103363d496dSStefano Zampini { 2104363d496dSStefano Zampini PetscFunctionBegin; 21056ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 21066ea7df73SStefano Zampini { 21076ea7df73SStefano Zampini Mat B; 21086ea7df73SStefano Zampini hypre_ParCSRMatrix *x,*y,*z; 21096ea7df73SStefano Zampini 21105f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR(Y,&y)); 21115f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR(X,&x)); 2112a74df02fSJacob Faibussowitsch PetscStackCallStandard(hypre_ParCSRMatrixAdd,1.0,y,1.0,x,&z); 21135f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateFromParCSR(z,MATHYPRE,PETSC_OWN_POINTER,&B)); 21145f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderMerge(Y,&B)); 21156ea7df73SStefano Zampini } 21166ea7df73SStefano Zampini #else 2117363d496dSStefano Zampini if (str == SAME_NONZERO_PATTERN) { 2118363d496dSStefano Zampini hypre_ParCSRMatrix *x,*y; 2119363d496dSStefano Zampini hypre_CSRMatrix *xloc,*yloc; 2120363d496dSStefano Zampini PetscInt xnnz,ynnz; 212139accc25SStefano Zampini HYPRE_Complex *xarr,*yarr; 2122363d496dSStefano Zampini PetscBLASInt one=1,bnz; 2123363d496dSStefano Zampini 21245f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR(Y,&y)); 21255f80ce2aSJacob Faibussowitsch CHKERRQ(MatHYPREGetParCSR(X,&x)); 2126363d496dSStefano Zampini 2127363d496dSStefano Zampini /* diagonal block */ 2128363d496dSStefano Zampini xloc = hypre_ParCSRMatrixDiag(x); 2129363d496dSStefano Zampini yloc = hypre_ParCSRMatrixDiag(y); 2130363d496dSStefano Zampini xnnz = 0; 2131363d496dSStefano Zampini ynnz = 0; 2132363d496dSStefano Zampini xarr = NULL; 2133363d496dSStefano Zampini yarr = NULL; 2134363d496dSStefano Zampini if (xloc) { 213539accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2136363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2137363d496dSStefano Zampini } 2138363d496dSStefano Zampini if (yloc) { 213939accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2140363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2141363d496dSStefano Zampini } 21422c71b3e2SJacob Faibussowitsch PetscCheckFalse(xnnz != ynnz,PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT,xnnz,ynnz); 21435f80ce2aSJacob Faibussowitsch CHKERRQ(PetscBLASIntCast(xnnz,&bnz)); 214439accc25SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&a,(PetscScalar*)xarr,&one,(PetscScalar*)yarr,&one)); 2145363d496dSStefano Zampini 2146363d496dSStefano Zampini /* off-diagonal block */ 2147363d496dSStefano Zampini xloc = hypre_ParCSRMatrixOffd(x); 2148363d496dSStefano Zampini yloc = hypre_ParCSRMatrixOffd(y); 2149363d496dSStefano Zampini xnnz = 0; 2150363d496dSStefano Zampini ynnz = 0; 2151363d496dSStefano Zampini xarr = NULL; 2152363d496dSStefano Zampini yarr = NULL; 2153363d496dSStefano Zampini if (xloc) { 215439accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc); 2155363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc); 2156363d496dSStefano Zampini } 2157363d496dSStefano Zampini if (yloc) { 215839accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc); 2159363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc); 2160363d496dSStefano Zampini } 21612c71b3e2SJacob Faibussowitsch PetscCheckFalse(xnnz != ynnz,PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT,xnnz,ynnz); 21625f80ce2aSJacob Faibussowitsch CHKERRQ(PetscBLASIntCast(xnnz,&bnz)); 216339accc25SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&a,(PetscScalar*)xarr,&one,(PetscScalar*)yarr,&one)); 2164363d496dSStefano Zampini } else if (str == SUBSET_NONZERO_PATTERN) { 21655f80ce2aSJacob Faibussowitsch CHKERRQ(MatAXPY_Basic(Y,a,X,str)); 2166363d496dSStefano Zampini } else { 2167363d496dSStefano Zampini Mat B; 2168363d496dSStefano Zampini 21695f80ce2aSJacob Faibussowitsch CHKERRQ(MatAXPY_Basic_Preallocate(Y,X,&B)); 21705f80ce2aSJacob Faibussowitsch CHKERRQ(MatAXPY_BasicWithPreallocation(B,Y,a,X,str)); 21715f80ce2aSJacob Faibussowitsch CHKERRQ(MatHeaderReplace(Y,&B)); 2172363d496dSStefano Zampini } 21736ea7df73SStefano Zampini #endif 2174363d496dSStefano Zampini PetscFunctionReturn(0); 2175363d496dSStefano Zampini } 2176363d496dSStefano Zampini 2177a055b5aaSBarry Smith /*MC 2178a055b5aaSBarry Smith MATHYPRE - MATHYPRE = "hypre" - A matrix type to be used for sequential and parallel sparse matrices 2179a055b5aaSBarry Smith based on the hypre IJ interface. 2180a055b5aaSBarry Smith 2181a055b5aaSBarry Smith Level: intermediate 2182a055b5aaSBarry Smith 2183a055b5aaSBarry Smith .seealso: MatCreate() 2184a055b5aaSBarry Smith M*/ 2185a055b5aaSBarry Smith 218663c07aadSStefano Zampini PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B) 218763c07aadSStefano Zampini { 218863c07aadSStefano Zampini Mat_HYPRE *hB; 218963c07aadSStefano Zampini 219063c07aadSStefano Zampini PetscFunctionBegin; 21915f80ce2aSJacob Faibussowitsch CHKERRQ(PetscNewLog(B,&hB)); 21926ea7df73SStefano Zampini 2193978814f1SStefano Zampini hB->inner_free = PETSC_TRUE; 2194c69f721fSFande Kong hB->available = PETSC_TRUE; 2195336664bdSPierre Jolivet hB->sorted_full = PETSC_FALSE; /* no assumption whether column indices are sorted or not */ 2196c69f721fSFande Kong hB->size = 0; 2197c69f721fSFande Kong hB->array = NULL; 2198978814f1SStefano Zampini 219963c07aadSStefano Zampini B->data = (void*)hB; 220063c07aadSStefano Zampini B->assembled = PETSC_FALSE; 220163c07aadSStefano Zampini 22025f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMemzero(B->ops,sizeof(struct _MatOps))); 220363c07aadSStefano Zampini B->ops->mult = MatMult_HYPRE; 220463c07aadSStefano Zampini B->ops->multtranspose = MatMultTranspose_HYPRE; 2205414bd5c3SStefano Zampini B->ops->multadd = MatMultAdd_HYPRE; 2206414bd5c3SStefano Zampini B->ops->multtransposeadd = MatMultTransposeAdd_HYPRE; 220763c07aadSStefano Zampini B->ops->setup = MatSetUp_HYPRE; 220863c07aadSStefano Zampini B->ops->destroy = MatDestroy_HYPRE; 220963c07aadSStefano Zampini B->ops->assemblyend = MatAssemblyEnd_HYPRE; 2210c69f721fSFande Kong B->ops->assemblybegin = MatAssemblyBegin_HYPRE; 2211d975228cSstefano_zampini B->ops->setvalues = MatSetValues_HYPRE; 221268ec7858SStefano Zampini B->ops->missingdiagonal = MatMissingDiagonal_HYPRE; 221368ec7858SStefano Zampini B->ops->scale = MatScale_HYPRE; 221468ec7858SStefano Zampini B->ops->zerorowscolumns = MatZeroRowsColumns_HYPRE; 2215c69f721fSFande Kong B->ops->zeroentries = MatZeroEntries_HYPRE; 2216c69f721fSFande Kong B->ops->zerorows = MatZeroRows_HYPRE; 2217c69f721fSFande Kong B->ops->getrow = MatGetRow_HYPRE; 2218c69f721fSFande Kong B->ops->restorerow = MatRestoreRow_HYPRE; 2219c69f721fSFande Kong B->ops->getvalues = MatGetValues_HYPRE; 2220ddbeb582SStefano Zampini B->ops->setoption = MatSetOption_HYPRE; 222145b8d346SStefano Zampini B->ops->duplicate = MatDuplicate_HYPRE; 2222465edc17SStefano Zampini B->ops->copy = MatCopy_HYPRE; 222345b8d346SStefano Zampini B->ops->view = MatView_HYPRE; 22246305df00SStefano Zampini B->ops->getdiagonal = MatGetDiagonal_HYPRE; 2225363d496dSStefano Zampini B->ops->axpy = MatAXPY_HYPRE; 22264222ddf1SHong Zhang B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE; 22276ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 22286ea7df73SStefano Zampini B->ops->bindtocpu = MatBindToCPU_HYPRE; 22296ea7df73SStefano Zampini B->boundtocpu = PETSC_FALSE; 22306ea7df73SStefano Zampini #endif 223145b8d346SStefano Zampini 223245b8d346SStefano Zampini /* build cache for off array entries formed */ 22335f80ce2aSJacob Faibussowitsch CHKERRQ(MatStashCreate_Private(PetscObjectComm((PetscObject)B),1,&B->stash)); 223463c07aadSStefano Zampini 22355f80ce2aSJacob Faibussowitsch CHKERRQ(PetscCommGetComm(PetscObjectComm((PetscObject)B),&hB->comm)); 22365f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectChangeTypeName((PetscObject)B,MATHYPRE)); 22375f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)B,"MatConvert_hypre_aij_C",MatConvert_HYPRE_AIJ)); 22385f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)B,"MatConvert_hypre_is_C",MatConvert_HYPRE_IS)); 22395f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_hypre_C",MatProductSetFromOptions_HYPRE)); 22405f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_mpiaij_hypre_C",MatProductSetFromOptions_HYPRE)); 22415f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)B,"MatHYPRESetPreallocation_C",MatHYPRESetPreallocation_HYPRE)); 22425f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectComposeFunction((PetscObject)B,"MatHYPREGetParCSR_C",MatHYPREGetParCSR_HYPRE)); 22436ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE) 22446ea7df73SStefano Zampini #if defined(HYPRE_USING_HIP) 22455f80ce2aSJacob Faibussowitsch CHKERRQ(PetscDeviceInitialize(PETSC_DEVICE_HIP)); 22465f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetVecType(B,VECHIP)); 22476ea7df73SStefano Zampini #endif 22486ea7df73SStefano Zampini #if defined(HYPRE_USING_CUDA) 22495f80ce2aSJacob Faibussowitsch CHKERRQ(PetscDeviceInitialize(PETSC_DEVICE_CUDA)); 22505f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetVecType(B,VECCUDA)); 22516ea7df73SStefano Zampini #endif 22526ea7df73SStefano Zampini #endif 225363c07aadSStefano Zampini PetscFunctionReturn(0); 225463c07aadSStefano Zampini } 225563c07aadSStefano Zampini 2256225daaf8SStefano Zampini static PetscErrorCode hypre_array_destroy(void *ptr) 2257225daaf8SStefano Zampini { 2258225daaf8SStefano Zampini PetscFunctionBegin; 2259e6de0934SSatish Balay hypre_TFree(ptr,HYPRE_MEMORY_HOST); 2260225daaf8SStefano Zampini PetscFunctionReturn(0); 2261225daaf8SStefano Zampini } 2262