15b89ad90SMark F. Adams /* 20cd22d39SHong Zhang GAMG geometric-algebric multigrid PC - Mark Adams 2011 35b89ad90SMark F. Adams */ 4389730f3SMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h> /*I "petscpc.h" I*/ 518c3aa7eSMark #include <../src/ksp/ksp/impls/cheby/chebyshevimpl.h> /*I "petscksp.h" I*/ 6f96513f1SMatthew G Knepley 7c9567895SMark #if defined(PETSC_HAVE_CUDA) 8c9567895SMark #include <cuda_runtime.h> 9c9567895SMark #endif 10c9567895SMark 11c9567895SMark #if defined(PETSC_HAVE_HIP) 12c9567895SMark #include <hip/hip_runtime.h> 13c9567895SMark #endif 14c9567895SMark 15849bee69SMark Adams PetscLogEvent petsc_gamg_setup_events[GAMG_NUM_SET]; 164555aa8cSStefano Zampini PetscLogEvent petsc_gamg_setup_matmat_events[PETSC_MG_MAXLEVELS][3]; 170cbbd2e1SMark F. Adams 18849bee69SMark Adams // #define GAMG_STAGES 194555aa8cSStefano Zampini #if defined(GAMG_STAGES) 2018c3aa7eSMark static PetscLogStage gamg_stages[PETSC_MG_MAXLEVELS]; 21b4fbaa2aSMark F. Adams #endif 22f96513f1SMatthew G Knepley 230a545947SLisandro Dalcin static PetscFunctionList GAMGList = NULL; 243e3471ccSMark Adams static PetscBool PCGAMGPackageInitialized; 259d5b6da9SMark F. Adams 2666976f2fSJacob Faibussowitsch static PetscErrorCode PCReset_GAMG(PC pc) 27d71ae5a4SJacob Faibussowitsch { 28d3d6bff4SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 29d3d6bff4SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 30d3d6bff4SMark F. Adams 31d3d6bff4SMark F. Adams PetscFunctionBegin; 329566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg->data)); 331c1aac46SBarry Smith pc_gamg->data_sz = 0; 349566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg->orig_data)); 355f80ce2aSJacob Faibussowitsch for (PetscInt level = 0; level < PETSC_MG_MAXLEVELS; level++) { 3618c3aa7eSMark mg->min_eigen_DinvA[level] = 0; 3718c3aa7eSMark mg->max_eigen_DinvA[level] = 0; 3818c3aa7eSMark } 3918c3aa7eSMark pc_gamg->emin = 0; 4018c3aa7eSMark pc_gamg->emax = 0; 41978e3cbaSStefano Zampini PetscCall(PCReset_MG(pc)); 42e0b7e82fSBarry Smith PetscCall(MatCoarsenDestroy(&pc_gamg->asm_crs)); 433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44a2f3521dSMark F. Adams } 45a2f3521dSMark F. Adams 465b89ad90SMark F. Adams /* 47c238b0ebSToby Isaac PCGAMGCreateLevel_GAMG: create coarse op with RAP. repartition and/or reduce number 48a147abb0SMark F. Adams of active processors. 495b89ad90SMark F. Adams 505b89ad90SMark F. Adams Input Parameter: 51a2f3521dSMark F. Adams . pc - parameters + side effect: coarse data in 'pc_gamg->data' and 52a2f3521dSMark F. Adams 'pc_gamg->data_sz' are changed via repartitioning/reduction. 539d5b6da9SMark F. Adams . Amat_fine - matrix on this fine (k) level 54c5bfad50SMark F. Adams . cr_bs - coarse block size 553530afc2SMark F. Adams In/Output Parameter: 56a2f3521dSMark F. Adams . a_P_inout - prolongation operator to the next level (k-->k-1) 57afc97cdcSMark F. Adams . a_nactive_proc - number of active procs 5811e60469SMark F. Adams Output Parameter: 593530afc2SMark F. Adams . a_Amat_crs - coarse matrix that is created (k-1) 605b89ad90SMark F. Adams */ 61d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGCreateLevel_GAMG(PC pc, Mat Amat_fine, PetscInt cr_bs, Mat *a_P_inout, Mat *a_Amat_crs, PetscMPIInt *a_nactive_proc, IS *Pcolumnperm, PetscBool is_last) 62d71ae5a4SJacob Faibussowitsch { 639d5b6da9SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 64486a8d0bSJed Brown PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 656c34c54dSStefano Zampini Mat Cmat = NULL, Pold = *a_P_inout; 663b4367a7SBarry Smith MPI_Comm comm; 67c5df96a5SBarry Smith PetscMPIInt rank, size, new_size, nactive = *a_nactive_proc; 683ae0bb68SMark Adams PetscInt ncrs_eq, ncrs, f_bs; 695b89ad90SMark F. Adams 705b89ad90SMark F. Adams PetscFunctionBegin; 719566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)Amat_fine, &comm)); 729566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &rank)); 739566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 749566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(Amat_fine, &f_bs)); 75038e3b61SMark F. Adams 76ce7c7f2fSMark Adams if (Pcolumnperm) *Pcolumnperm = NULL; 77ce7c7f2fSMark Adams 783ae0bb68SMark Adams /* set 'ncrs' (nodes), 'ncrs_eq' (equations)*/ 796c34c54dSStefano Zampini PetscCall(MatGetLocalSize(Pold, NULL, &ncrs_eq)); 803ae0bb68SMark Adams if (pc_gamg->data_cell_rows > 0) { 813ae0bb68SMark Adams ncrs = pc_gamg->data_sz / pc_gamg->data_cell_cols / pc_gamg->data_cell_rows; 8273911c69SBarry Smith } else { 833ae0bb68SMark Adams PetscInt bs; 846c34c54dSStefano Zampini PetscCall(MatGetBlockSizes(Pold, NULL, &bs)); 853ae0bb68SMark Adams ncrs = ncrs_eq / bs; 863ae0bb68SMark Adams } 87c5df96a5SBarry Smith /* get number of PEs to make active 'new_size', reduce, can be any integer 1-P */ 88c9567895SMark if (pc_gamg->level_reduction_factors[pc_gamg->current_level] == 0 && PetscDefined(HAVE_CUDA) && pc_gamg->current_level == 0) { /* 0 turns reducing to 1 process/device on; do for HIP, etc. */ 89c9567895SMark #if defined(PETSC_HAVE_CUDA) 90c9567895SMark PetscShmComm pshmcomm; 91c9567895SMark PetscMPIInt locrank; 92c9567895SMark MPI_Comm loccomm; 93c9567895SMark PetscInt s_nnodes, r_nnodes, new_new_size; 94c9567895SMark cudaError_t cerr; 95c9567895SMark int devCount; 969566063dSJacob Faibussowitsch PetscCall(PetscShmCommGet(comm, &pshmcomm)); 979566063dSJacob Faibussowitsch PetscCall(PetscShmCommGetMpiShmComm(pshmcomm, &loccomm)); 989566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(loccomm, &locrank)); 99c9567895SMark s_nnodes = !locrank; 100712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&s_nnodes, &r_nnodes, 1, MPIU_INT, MPI_SUM, comm)); 10163a3b9bcSJacob Faibussowitsch PetscCheck((size % r_nnodes) == 0, PETSC_COMM_SELF, PETSC_ERR_PLIB, "odd number of nodes np=%d nnodes%" PetscInt_FMT, size, r_nnodes); 102c9567895SMark devCount = 0; 103c9567895SMark cerr = cudaGetDeviceCount(&devCount); 104c9567895SMark cudaGetLastError(); /* Reset the last error */ 105c9567895SMark if (cerr == cudaSuccess && devCount >= 1) { /* There are devices, else go to heuristic */ 106c9567895SMark new_new_size = r_nnodes * devCount; 107c9567895SMark new_size = new_new_size; 10863a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: Fine grid with Cuda. %" PetscInt_FMT " nodes. Change new active set size %d --> %d (devCount=%d #nodes=%" PetscInt_FMT ")\n", ((PetscObject)pc)->prefix, r_nnodes, nactive, new_size, devCount, r_nnodes)); 109c9567895SMark } else { 1109d3446b2SPierre Jolivet PetscCall(PetscInfo(pc, "%s: With Cuda but no device. Use heuristics.\n", ((PetscObject)pc)->prefix)); 111c9567895SMark goto HEURISTIC; 112c9567895SMark } 113c9567895SMark #else 114c9567895SMark SETERRQ(PETSC_COMM_SELF, PETSC_ERR_PLIB, "should not be here"); 115c9567895SMark #endif 116c9567895SMark } else if (pc_gamg->level_reduction_factors[pc_gamg->current_level] > 0) { 1177509f629SMark Adams if (nactive < pc_gamg->level_reduction_factors[pc_gamg->current_level]) { 1187509f629SMark Adams new_size = 1; 1197509f629SMark Adams PetscCall(PetscInfo(pc, "%s: reduction factor too small for %d active processes: reduce to one process\n", ((PetscObject)pc)->prefix, new_size)); 1207509f629SMark Adams } else { 12163a3b9bcSJacob Faibussowitsch PetscCheck(nactive % pc_gamg->level_reduction_factors[pc_gamg->current_level] == 0, PETSC_COMM_SELF, PETSC_ERR_PLIB, "odd number of active process %d wrt reduction factor %" PetscInt_FMT, nactive, pc_gamg->level_reduction_factors[pc_gamg->current_level]); 122c9567895SMark new_size = nactive / pc_gamg->level_reduction_factors[pc_gamg->current_level]; 12363a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: Manually setting reduction to %d active processes (%d/%" PetscInt_FMT ")\n", ((PetscObject)pc)->prefix, new_size, nactive, pc_gamg->level_reduction_factors[pc_gamg->current_level])); 1247509f629SMark Adams } 125c9567895SMark } else if (is_last && !pc_gamg->use_parallel_coarse_grid_solver) { 126c9567895SMark new_size = 1; 1279566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: Force coarsest grid reduction to %d active processes\n", ((PetscObject)pc)->prefix, new_size)); 128c9567895SMark } else { 129472110cdSMark F. Adams PetscInt ncrs_eq_glob; 130c9567895SMark #if defined(PETSC_HAVE_CUDA) 131c9567895SMark HEURISTIC: 132c9567895SMark #endif 1336c34c54dSStefano Zampini PetscCall(MatGetSize(Pold, NULL, &ncrs_eq_glob)); 134a90e85d9SMark Adams new_size = (PetscMPIInt)((float)ncrs_eq_glob / (float)pc_gamg->min_eq_proc + 0.5); /* hardwire min. number of eq/proc */ 135da81f932SPierre Jolivet if (!new_size) new_size = 1; /* not likely, possible? */ 136c5df96a5SBarry Smith else if (new_size >= nactive) new_size = nactive; /* no change, rare */ 1379566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: Coarse grid reduction from %d to %d active processes\n", ((PetscObject)pc)->prefix, nactive, new_size)); 138a2f3521dSMark F. Adams } 1392e3501ffSMark Adams if (new_size == nactive) { 1406c34c54dSStefano Zampini /* output - no repartitioning or reduction - could bail here 1416c34c54dSStefano Zampini we know that the grid structure can be reused in MatPtAP */ 1426c34c54dSStefano Zampini PetscCall(PetscLogEventBegin(petsc_gamg_setup_events[GAMG_PTAP], 0, 0, 0, 0)); 1436c34c54dSStefano Zampini PetscCall(PetscLogEventBegin(petsc_gamg_setup_matmat_events[pc_gamg->current_level][1], 0, 0, 0, 0)); 1446c34c54dSStefano Zampini PetscCall(MatPtAP(Amat_fine, Pold, MAT_INITIAL_MATRIX, 2.0, a_Amat_crs)); 1456c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_matmat_events[pc_gamg->current_level][1], 0, 0, 0, 0)); 1466c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_PTAP], 0, 0, 0, 0)); 147ce7c7f2fSMark Adams if (new_size < size) { 148ce7c7f2fSMark Adams /* odd case where multiple coarse grids are on one processor or no coarsening ... */ 1499566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: reduced grid using same number of processors (%d) as last grid (use larger coarse grid)\n", ((PetscObject)pc)->prefix, nactive)); 150ce7c7f2fSMark Adams if (pc_gamg->cpu_pin_coarse_grids) { 1519566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*a_Amat_crs, PETSC_TRUE)); 1529566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*a_P_inout, PETSC_TRUE)); 153ce7c7f2fSMark Adams } 154ce7c7f2fSMark Adams } 1552e3501ffSMark Adams } else { /* reduce active processors - we know that the grid structure can NOT be reused in MatPtAP */ 156192c0e8bSMark Adams PetscInt *counts, *newproc_idx, ii, jj, kk, strideNew, *tidx, ncrs_new, ncrs_eq_new, nloc_old, expand_factor = 1, rfactor = 1; 1576c34c54dSStefano Zampini IS is_eq_newproc, is_eq_num, new_eq_indices; 158849bee69SMark Adams PetscCall(PetscLogEventBegin(petsc_gamg_setup_events[GAMG_REDUCE], 0, 0, 0, 0)); 15971959b99SBarry Smith nloc_old = ncrs_eq / cr_bs; 16063a3b9bcSJacob Faibussowitsch PetscCheck(ncrs_eq % cr_bs == 0, PETSC_COMM_SELF, PETSC_ERR_PLIB, "ncrs_eq %" PetscInt_FMT " not divisible by cr_bs %" PetscInt_FMT, ncrs_eq, cr_bs); 161ce7c7f2fSMark Adams /* get new_size and rfactor */ 162ce7c7f2fSMark Adams if (pc_gamg->layout_type == PCGAMG_LAYOUT_SPREAD || !pc_gamg->repart) { 163ce7c7f2fSMark Adams /* find factor */ 164ce7c7f2fSMark Adams if (new_size == 1) rfactor = size; /* don't modify */ 165ce7c7f2fSMark Adams else { 166ce7c7f2fSMark Adams PetscReal best_fact = 0.; 167ce7c7f2fSMark Adams jj = -1; 168ce7c7f2fSMark Adams for (kk = 1; kk <= size; kk++) { 169ce7c7f2fSMark Adams if (!(size % kk)) { /* a candidate */ 170ce7c7f2fSMark Adams PetscReal nactpe = (PetscReal)size / (PetscReal)kk, fact = nactpe / (PetscReal)new_size; 171ce7c7f2fSMark Adams if (fact > 1.0) fact = 1. / fact; /* keep fact < 1 */ 172ce7c7f2fSMark Adams if (fact > best_fact) { 1739371c9d4SSatish Balay best_fact = fact; 1749371c9d4SSatish Balay jj = kk; 175ce7c7f2fSMark Adams } 176ce7c7f2fSMark Adams } 177ce7c7f2fSMark Adams } 178ce7c7f2fSMark Adams if (jj != -1) rfactor = jj; 179ce7c7f2fSMark Adams else rfactor = 1; /* a prime */ 180ce7c7f2fSMark Adams if (pc_gamg->layout_type == PCGAMG_LAYOUT_COMPACT) expand_factor = 1; 181ce7c7f2fSMark Adams else expand_factor = rfactor; 182ce7c7f2fSMark Adams } 183ce7c7f2fSMark Adams new_size = size / rfactor; /* make new size one that is factor */ 1844cdfd227SMark if (new_size == nactive) { /* no repartitioning or reduction, bail out because nested here (rare) */ 18563a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: Finding factorable processor set stopped reduction: new_size=%d, neq(loc)=%" PetscInt_FMT "\n", ((PetscObject)pc)->prefix, new_size, ncrs_eq)); 186849bee69SMark Adams PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_REDUCE], 0, 0, 0, 0)); 1876c34c54dSStefano Zampini PetscCall(PetscLogEventBegin(petsc_gamg_setup_events[GAMG_PTAP], 0, 0, 0, 0)); 1886c34c54dSStefano Zampini PetscCall(PetscLogEventBegin(petsc_gamg_setup_matmat_events[pc_gamg->current_level][1], 0, 0, 0, 0)); 1896c34c54dSStefano Zampini PetscCall(MatPtAP(Amat_fine, Pold, MAT_INITIAL_MATRIX, 2.0, a_Amat_crs)); 1906c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_matmat_events[pc_gamg->current_level][1], 0, 0, 0, 0)); 1916c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_PTAP], 0, 0, 0, 0)); 1923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 193ce7c7f2fSMark Adams } 194ce7c7f2fSMark Adams } 195a2f3521dSMark F. Adams /* make 'is_eq_newproc' */ 196849bee69SMark Adams if (pc_gamg->repart) { /* Repartition Cmat_{k} and move columns of P^{k}_{k-1} and coordinates of primal part accordingly */ 1975a9b9e01SMark F. Adams Mat adj; 1986c34c54dSStefano Zampini 1996c34c54dSStefano Zampini PetscCall(PetscLogEventBegin(petsc_gamg_setup_events[GAMG_PTAP], 0, 0, 0, 0)); 2006c34c54dSStefano Zampini PetscCall(PetscLogEventBegin(petsc_gamg_setup_matmat_events[pc_gamg->current_level][1], 0, 0, 0, 0)); 2016c34c54dSStefano Zampini PetscCall(MatPtAP(Amat_fine, Pold, MAT_INITIAL_MATRIX, 2.0, &Cmat)); 2026c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_matmat_events[pc_gamg->current_level][1], 0, 0, 0, 0)); 2036c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_PTAP], 0, 0, 0, 0)); 204849bee69SMark Adams PetscCall(PetscLogEventBegin(petsc_gamg_setup_events[GAMG_REPART], 0, 0, 0, 0)); 20563a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: Repartition: size (active): %d --> %d, %" PetscInt_FMT " local equations, using %s process layout\n", ((PetscObject)pc)->prefix, *a_nactive_proc, new_size, ncrs_eq, (pc_gamg->layout_type == PCGAMG_LAYOUT_COMPACT) ? "compact" : "spread")); 206a2f3521dSMark F. Adams /* get 'adj' */ 207c5bfad50SMark F. Adams if (cr_bs == 1) { 2089566063dSJacob Faibussowitsch PetscCall(MatConvert(Cmat, MATMPIADJ, MAT_INITIAL_MATRIX, &adj)); 209806fa848SBarry Smith } else { 210a2f3521dSMark F. Adams /* make a scalar matrix to partition (no Stokes here) */ 211eb07cef2SMark F. Adams Mat tMat; 212a2f3521dSMark F. Adams PetscInt Istart_crs, Iend_crs, ncols, jj, Ii; 213b4fbaa2aSMark F. Adams const PetscScalar *vals; 214b4fbaa2aSMark F. Adams const PetscInt *idx; 215*c8b01eeaSMark Adams PetscInt *d_nnz, *o_nnz, M, N, maxnnz = 0, *j_buf = NULL; 216*c8b01eeaSMark Adams PetscScalar *v_buff = NULL; 21739d09545SMark Adams static PetscInt llev = 0; /* ugly but just used for debugging */ 218d9558ea9SBarry Smith MatType mtype; 219b4fbaa2aSMark F. Adams 2209566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(ncrs, &d_nnz, ncrs, &o_nnz)); 2219566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(Cmat, &Istart_crs, &Iend_crs)); 2229566063dSJacob Faibussowitsch PetscCall(MatGetSize(Cmat, &M, &N)); 223c5bfad50SMark F. Adams for (Ii = Istart_crs, jj = 0; Ii < Iend_crs; Ii += cr_bs, jj++) { 2249566063dSJacob Faibussowitsch PetscCall(MatGetRow(Cmat, Ii, &ncols, NULL, NULL)); 225c5bfad50SMark F. Adams d_nnz[jj] = ncols / cr_bs; 226c5bfad50SMark F. Adams o_nnz[jj] = ncols / cr_bs; 227*c8b01eeaSMark Adams if (ncols > maxnnz) maxnnz = ncols; 2289566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(Cmat, Ii, &ncols, NULL, NULL)); 2293ae0bb68SMark Adams if (d_nnz[jj] > ncrs) d_nnz[jj] = ncrs; 2303ae0bb68SMark Adams if (o_nnz[jj] > (M / cr_bs - ncrs)) o_nnz[jj] = M / cr_bs - ncrs; 23158471d46SMark F. Adams } 2326876a03eSMark F. Adams 2339566063dSJacob Faibussowitsch PetscCall(MatGetType(Amat_fine, &mtype)); 2349566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &tMat)); 2359566063dSJacob Faibussowitsch PetscCall(MatSetSizes(tMat, ncrs, ncrs, PETSC_DETERMINE, PETSC_DETERMINE)); 2369566063dSJacob Faibussowitsch PetscCall(MatSetType(tMat, mtype)); 2379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(tMat, 0, d_nnz)); 2389566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(tMat, 0, d_nnz, 0, o_nnz)); 2399566063dSJacob Faibussowitsch PetscCall(PetscFree2(d_nnz, o_nnz)); 240*c8b01eeaSMark Adams PetscCall(PetscMalloc2(maxnnz, &j_buf, maxnnz, &v_buff)); 241*c8b01eeaSMark Adams for (ii = 0; ii < maxnnz; ii++) v_buff[ii] = 1.; 242eb07cef2SMark F. Adams 243a2f3521dSMark F. Adams for (ii = Istart_crs; ii < Iend_crs; ii++) { 244c5bfad50SMark F. Adams PetscInt dest_row = ii / cr_bs; 2459566063dSJacob Faibussowitsch PetscCall(MatGetRow(Cmat, ii, &ncols, &idx, &vals)); 246*c8b01eeaSMark Adams for (jj = 0; jj < ncols; jj++) j_buf[jj] = idx[jj] / cr_bs; 247*c8b01eeaSMark Adams PetscCall(MatSetValues(tMat, 1, &dest_row, ncols, j_buf, v_buff, ADD_VALUES)); 2489566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(Cmat, ii, &ncols, &idx, &vals)); 249eb07cef2SMark F. Adams } 2509566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(tMat, MAT_FINAL_ASSEMBLY)); 2519566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(tMat, MAT_FINAL_ASSEMBLY)); 252*c8b01eeaSMark Adams PetscCall(PetscFree2(j_buf, v_buff)); 253eb07cef2SMark F. Adams 254b4fbaa2aSMark F. Adams if (llev++ == -1) { 2559371c9d4SSatish Balay PetscViewer viewer; 2569371c9d4SSatish Balay char fname[32]; 25763a3b9bcSJacob Faibussowitsch PetscCall(PetscSNPrintf(fname, sizeof(fname), "part_mat_%" PetscInt_FMT ".mat", llev)); 2583ba16761SJacob Faibussowitsch PetscCall(PetscViewerBinaryOpen(comm, fname, FILE_MODE_WRITE, &viewer)); 2599566063dSJacob Faibussowitsch PetscCall(MatView(tMat, viewer)); 2609566063dSJacob Faibussowitsch PetscCall(PetscViewerDestroy(&viewer)); 261b4fbaa2aSMark F. Adams } 2629566063dSJacob Faibussowitsch PetscCall(MatConvert(tMat, MATMPIADJ, MAT_INITIAL_MATRIX, &adj)); 2639566063dSJacob Faibussowitsch PetscCall(MatDestroy(&tMat)); 264a2f3521dSMark F. Adams } /* create 'adj' */ 265f150b916SMark F. Adams 266a2f3521dSMark F. Adams { /* partition: get newproc_idx */ 2675a9b9e01SMark F. Adams char prefix[256]; 2685a9b9e01SMark F. Adams const char *pcpre; 269b4fbaa2aSMark F. Adams const PetscInt *is_idx; 270b4fbaa2aSMark F. Adams MatPartitioning mpart; 271a4b7d37bSMark F. Adams IS proc_is; 2722f03bc48SMark F. Adams 2739566063dSJacob Faibussowitsch PetscCall(MatPartitioningCreate(comm, &mpart)); 2749566063dSJacob Faibussowitsch PetscCall(MatPartitioningSetAdjacency(mpart, adj)); 2759566063dSJacob Faibussowitsch PetscCall(PCGetOptionsPrefix(pc, &pcpre)); 2769566063dSJacob Faibussowitsch PetscCall(PetscSNPrintf(prefix, sizeof(prefix), "%spc_gamg_", pcpre ? pcpre : "")); 2779566063dSJacob Faibussowitsch PetscCall(PetscObjectSetOptionsPrefix((PetscObject)mpart, prefix)); 2789566063dSJacob Faibussowitsch PetscCall(MatPartitioningSetFromOptions(mpart)); 2799566063dSJacob Faibussowitsch PetscCall(MatPartitioningSetNParts(mpart, new_size)); 2809566063dSJacob Faibussowitsch PetscCall(MatPartitioningApply(mpart, &proc_is)); 2819566063dSJacob Faibussowitsch PetscCall(MatPartitioningDestroy(&mpart)); 2825a9b9e01SMark F. Adams 2835ef31b24SMark F. Adams /* collect IS info */ 2849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ncrs_eq, &newproc_idx)); 2859566063dSJacob Faibussowitsch PetscCall(ISGetIndices(proc_is, &is_idx)); 286a2f3521dSMark F. Adams for (kk = jj = 0; kk < nloc_old; kk++) { 2879371c9d4SSatish Balay for (ii = 0; ii < cr_bs; ii++, jj++) { newproc_idx[jj] = is_idx[kk] * expand_factor; /* distribution */ } 2885ef31b24SMark F. Adams } 2899566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(proc_is, &is_idx)); 2909566063dSJacob Faibussowitsch PetscCall(ISDestroy(&proc_is)); 2915ef31b24SMark F. Adams } 2929566063dSJacob Faibussowitsch PetscCall(MatDestroy(&adj)); 2935a9b9e01SMark F. Adams 2946c34c54dSStefano Zampini PetscCall(ISCreateGeneral(comm, ncrs_eq, newproc_idx, PETSC_OWN_POINTER, &is_eq_newproc)); 29511e60469SMark F. Adams /* 296a2f3521dSMark F. Adams Create an index set from the is_eq_newproc index set to indicate the mapping TO 29711e60469SMark F. Adams */ 2989566063dSJacob Faibussowitsch PetscCall(ISPartitioningToNumbering(is_eq_newproc, &is_eq_num)); 29911e60469SMark F. Adams /* 300a2f3521dSMark F. Adams Determine how many equations/vertices are assigned to each processor 30111e60469SMark F. Adams */ 3026c34c54dSStefano Zampini PetscCall(PetscMalloc1(size, &counts)); 3039566063dSJacob Faibussowitsch PetscCall(ISPartitioningCount(is_eq_newproc, size, counts)); 304c5df96a5SBarry Smith ncrs_eq_new = counts[rank]; 3059566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_eq_newproc)); 3066c34c54dSStefano Zampini PetscCall(PetscFree(counts)); 3076c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_REPART], 0, 0, 0, 0)); 3086c34c54dSStefano Zampini } else { /* simple aggregation of parts -- 'is_eq_newproc' */ 3096c34c54dSStefano Zampini const PetscInt *ranges; 3106c34c54dSStefano Zampini PetscInt newstart = 0; 3116c34c54dSStefano Zampini PetscLayout ilay; 3126c34c54dSStefano Zampini 3136c34c54dSStefano Zampini PetscCheck(new_size != nactive, PETSC_COMM_SELF, PETSC_ERR_PLIB, "new_size==nactive. Should not happen"); 3146c34c54dSStefano Zampini PetscCall(PetscInfo(pc, "%s: Number of equations (loc) %" PetscInt_FMT " with simple aggregation\n", ((PetscObject)pc)->prefix, ncrs_eq)); 3156c34c54dSStefano Zampini PetscCallMPI(MPI_Exscan(&ncrs_eq, &newstart, 1, MPIU_INT, MPI_SUM, comm)); 3166c34c54dSStefano Zampini PetscCall(ISCreateStride(comm, ncrs_eq, newstart, 1, &is_eq_num)); 3176c34c54dSStefano Zampini PetscCall(ISSetPermutation(is_eq_num)); 3186c34c54dSStefano Zampini PetscCall(ISGetLayout(is_eq_num, &ilay)); 3196c34c54dSStefano Zampini PetscCall(PetscLayoutGetRanges(ilay, &ranges)); 3206c34c54dSStefano Zampini ncrs_eq_new = 0; 3216c34c54dSStefano Zampini for (PetscInt r = 0; r < size; r++) 3226c34c54dSStefano Zampini if (rank == (r / rfactor) * expand_factor) ncrs_eq_new += ranges[r + 1] - ranges[r]; 3236c34c54dSStefano Zampini //targetPE = (rank / rfactor) * expand_factor; 3246c34c54dSStefano Zampini //PetscCall(ISCreateStride(comm, ncrs_eq, targetPE, 0, &is_eq_newproc)); 3256c34c54dSStefano Zampini //PetscCall(ISPartitioningToNumbering(is_eq_newproc, &is_eq_num)); 3266c34c54dSStefano Zampini //PetscCall(PetscMalloc1(size, &counts)); 3276c34c54dSStefano Zampini //PetscCall(ISPartitioningCount(is_eq_newproc, size, counts)); 3286c34c54dSStefano Zampini //ncrs_eq_new = counts[rank]; 3296c34c54dSStefano Zampini //PetscCall(ISDestroy(&is_eq_newproc)); 3306c34c54dSStefano Zampini //PetscCall(PetscFree(counts)); 3316c34c54dSStefano Zampini } /* end simple 'is_eq_newproc' */ 3326c34c54dSStefano Zampini 333ce7c7f2fSMark Adams ncrs_new = ncrs_eq_new / cr_bs; 334a2f3521dSMark F. Adams 3356aad120cSJose E. Roman /* data movement scope -- this could be moved to subclasses so that we don't try to cram all auxiliary data into some complex abstracted thing */ 336885364a3SMark Adams { 337885364a3SMark Adams Vec src_crd, dest_crd; 338885364a3SMark Adams const PetscInt *idx, ndata_rows = pc_gamg->data_cell_rows, ndata_cols = pc_gamg->data_cell_cols, node_data_sz = ndata_rows * ndata_cols; 339885364a3SMark Adams VecScatter vecscat; 340885364a3SMark Adams PetscScalar *array; 341885364a3SMark Adams IS isscat; 342a2f3521dSMark F. Adams /* move data (for primal equations only) */ 34322063be5SMark F. Adams /* Create a vector to contain the newly ordered element information */ 3449566063dSJacob Faibussowitsch PetscCall(VecCreate(comm, &dest_crd)); 3459566063dSJacob Faibussowitsch PetscCall(VecSetSizes(dest_crd, node_data_sz * ncrs_new, PETSC_DECIDE)); 3469566063dSJacob Faibussowitsch PetscCall(VecSetType(dest_crd, VECSTANDARD)); /* this is needed! */ 34711e60469SMark F. Adams /* 3489d5b6da9SMark F. Adams There are 'ndata_rows*ndata_cols' data items per node, (one can think of the vectors of having 349c5bfad50SMark F. Adams a block size of ...). Note, ISs are expanded into equation space by 'cr_bs'. 35011e60469SMark F. Adams */ 3519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ncrs * node_data_sz, &tidx)); 3526c34c54dSStefano Zampini PetscCall(ISGetIndices(is_eq_num, &idx)); 3533ae0bb68SMark Adams for (ii = 0, jj = 0; ii < ncrs; ii++) { 354c5bfad50SMark F. Adams PetscInt id = idx[ii * cr_bs] / cr_bs; /* get node back */ 355a2f3521dSMark F. Adams for (kk = 0; kk < node_data_sz; kk++, jj++) tidx[jj] = id * node_data_sz + kk; 35611e60469SMark F. Adams } 3576c34c54dSStefano Zampini PetscCall(ISRestoreIndices(is_eq_num, &idx)); 3589566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(comm, node_data_sz * ncrs, tidx, PETSC_COPY_VALUES, &isscat)); 3599566063dSJacob Faibussowitsch PetscCall(PetscFree(tidx)); 36011e60469SMark F. Adams /* 36111e60469SMark F. Adams Create a vector to contain the original vertex information for each element 36211e60469SMark F. Adams */ 3639566063dSJacob Faibussowitsch PetscCall(VecCreateSeq(PETSC_COMM_SELF, node_data_sz * ncrs, &src_crd)); 3649d5b6da9SMark F. Adams for (jj = 0; jj < ndata_cols; jj++) { 3653ae0bb68SMark Adams const PetscInt stride0 = ncrs * pc_gamg->data_cell_rows; 3663ae0bb68SMark Adams for (ii = 0; ii < ncrs; ii++) { 3679d5b6da9SMark F. Adams for (kk = 0; kk < ndata_rows; kk++) { 368a2f3521dSMark F. Adams PetscInt ix = ii * ndata_rows + kk + jj * stride0, jx = ii * node_data_sz + kk * ndata_cols + jj; 369c8b0795cSMark F. Adams PetscScalar tt = (PetscScalar)pc_gamg->data[ix]; 3709566063dSJacob Faibussowitsch PetscCall(VecSetValues(src_crd, 1, &jx, &tt, INSERT_VALUES)); 371d3d6bff4SMark F. Adams } 372038e3b61SMark F. Adams } 373eb07cef2SMark F. Adams } 3749566063dSJacob Faibussowitsch PetscCall(VecAssemblyBegin(src_crd)); 3759566063dSJacob Faibussowitsch PetscCall(VecAssemblyEnd(src_crd)); 37611e60469SMark F. Adams /* 37711e60469SMark F. Adams Scatter the element vertex information (still in the original vertex ordering) 37811e60469SMark F. Adams to the correct processor 37911e60469SMark F. Adams */ 3809566063dSJacob Faibussowitsch PetscCall(VecScatterCreate(src_crd, NULL, dest_crd, isscat, &vecscat)); 3819566063dSJacob Faibussowitsch PetscCall(ISDestroy(&isscat)); 3829566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(vecscat, src_crd, dest_crd, INSERT_VALUES, SCATTER_FORWARD)); 3839566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(vecscat, src_crd, dest_crd, INSERT_VALUES, SCATTER_FORWARD)); 3849566063dSJacob Faibussowitsch PetscCall(VecScatterDestroy(&vecscat)); 3859566063dSJacob Faibussowitsch PetscCall(VecDestroy(&src_crd)); 38611e60469SMark F. Adams /* 38711e60469SMark F. Adams Put the element vertex data into a new allocation of the gdata->ele 38811e60469SMark F. Adams */ 3899566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg->data)); 3909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(node_data_sz * ncrs_new, &pc_gamg->data)); 3912fa5cd67SKarl Rupp 3923ae0bb68SMark Adams pc_gamg->data_sz = node_data_sz * ncrs_new; 3933ae0bb68SMark Adams strideNew = ncrs_new * ndata_rows; 3942fa5cd67SKarl Rupp 3959566063dSJacob Faibussowitsch PetscCall(VecGetArray(dest_crd, &array)); 3969d5b6da9SMark F. Adams for (jj = 0; jj < ndata_cols; jj++) { 3973ae0bb68SMark Adams for (ii = 0; ii < ncrs_new; ii++) { 3989d5b6da9SMark F. Adams for (kk = 0; kk < ndata_rows; kk++) { 399a2f3521dSMark F. Adams PetscInt ix = ii * ndata_rows + kk + jj * strideNew, jx = ii * node_data_sz + kk * ndata_cols + jj; 400c8b0795cSMark F. Adams pc_gamg->data[ix] = PetscRealPart(array[jx]); 401d3d6bff4SMark F. Adams } 402038e3b61SMark F. Adams } 403038e3b61SMark F. Adams } 4049566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(dest_crd, &array)); 4059566063dSJacob Faibussowitsch PetscCall(VecDestroy(&dest_crd)); 406885364a3SMark Adams } 407a2f3521dSMark F. Adams /* move A and P (columns) with new layout */ 40811e60469SMark F. Adams /* 4097dae84e0SHong Zhang Invert for MatCreateSubMatrix 41011e60469SMark F. Adams */ 4119566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(is_eq_num, ncrs_eq_new, &new_eq_indices)); 4126c34c54dSStefano Zampini PetscCall(ISSort(new_eq_indices)); 4139566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(new_eq_indices, cr_bs)); 4143cb8563fSToby Isaac if (Pcolumnperm) { 4159566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)new_eq_indices)); 4163cb8563fSToby Isaac *Pcolumnperm = new_eq_indices; 4173cb8563fSToby Isaac } 4189566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_eq_num)); 419849bee69SMark Adams 420a2f3521dSMark F. Adams /* 'a_Amat_crs' output */ 4216c34c54dSStefano Zampini if (Cmat) { /* repartitioning from Cmat adjacency case */ 422a2f3521dSMark F. Adams Mat mat; 423b94d7dedSBarry Smith PetscBool isset, isspd, isher; 42490db8557SMark Adams #if !defined(PETSC_USE_COMPLEX) 425b94d7dedSBarry Smith PetscBool issym; 426b94d7dedSBarry Smith #endif 427b94d7dedSBarry Smith 428b94d7dedSBarry Smith PetscCall(MatCreateSubMatrix(Cmat, new_eq_indices, new_eq_indices, MAT_INITIAL_MATRIX, &mat)); 429b94d7dedSBarry Smith PetscCall(MatIsSPDKnown(Cmat, &isset, &isspd)); // like MatPropagateSymmetryOptions, but should set MAT_STRUCTURALLY_SYMMETRIC ? 430b94d7dedSBarry Smith if (isset) PetscCall(MatSetOption(mat, MAT_SPD, isspd)); 431b94d7dedSBarry Smith else { 432b94d7dedSBarry Smith PetscCall(MatIsHermitianKnown(Cmat, &isset, &isher)); 433b94d7dedSBarry Smith if (isset) PetscCall(MatSetOption(mat, MAT_HERMITIAN, isher)); 434b94d7dedSBarry Smith else { 435b94d7dedSBarry Smith #if !defined(PETSC_USE_COMPLEX) 436b94d7dedSBarry Smith PetscCall(MatIsSymmetricKnown(Cmat, &isset, &issym)); 437b94d7dedSBarry Smith if (isset) PetscCall(MatSetOption(mat, MAT_SYMMETRIC, issym)); 43890db8557SMark Adams #endif 43990db8557SMark Adams } 44090db8557SMark Adams } 441a2f3521dSMark F. Adams *a_Amat_crs = mat; 442a2f3521dSMark F. Adams } 443a2f3521dSMark F. Adams 44411e60469SMark F. Adams /* prolongator */ 44511e60469SMark F. Adams { 44611e60469SMark F. Adams IS findices; 447a2f3521dSMark F. Adams PetscInt Istart, Iend; 448a2f3521dSMark F. Adams Mat Pnew; 44962294041SBarry Smith 4509566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(Pold, &Istart, &Iend)); 4519566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, Iend - Istart, Istart, 1, &findices)); 4529566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(findices, f_bs)); 4539566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrix(Pold, findices, new_eq_indices, MAT_INITIAL_MATRIX, &Pnew)); 4549566063dSJacob Faibussowitsch PetscCall(ISDestroy(&findices)); 4559566063dSJacob Faibussowitsch PetscCall(MatSetOption(Pnew, MAT_FORM_EXPLICIT_TRANSPOSE, PETSC_TRUE)); 456c5bfad50SMark F. Adams 4579566063dSJacob Faibussowitsch PetscCall(MatDestroy(a_P_inout)); 458a2f3521dSMark F. Adams 459a2f3521dSMark F. Adams /* output - repartitioned */ 460a2f3521dSMark F. Adams *a_P_inout = Pnew; 461e33ef3b1SMark F. Adams } 4626c34c54dSStefano Zampini 4636c34c54dSStefano Zampini if (!Cmat) { /* simple repartitioning case */ 4646c34c54dSStefano Zampini PetscCall(PetscLogEventBegin(petsc_gamg_setup_events[GAMG_PTAP], 0, 0, 0, 0)); 4656c34c54dSStefano Zampini PetscCall(PetscLogEventBegin(petsc_gamg_setup_matmat_events[pc_gamg->current_level][1], 0, 0, 0, 0)); 4666c34c54dSStefano Zampini PetscCall(MatPtAP(Amat_fine, *a_P_inout, MAT_INITIAL_MATRIX, 2.0, a_Amat_crs)); 4676c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_matmat_events[pc_gamg->current_level][1], 0, 0, 0, 0)); 4686c34c54dSStefano Zampini PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_PTAP], 0, 0, 0, 0)); 4696c34c54dSStefano Zampini } 4706c34c54dSStefano Zampini PetscCall(MatDestroy(&Cmat)); 4719566063dSJacob Faibussowitsch PetscCall(ISDestroy(&new_eq_indices)); 4725b89ad90SMark F. Adams 473c5df96a5SBarry Smith *a_nactive_proc = new_size; /* output */ 474ce7c7f2fSMark Adams 475ce7c7f2fSMark Adams /* pinning on reduced grids, not a bad heuristic and optimization gets folded into process reduction optimization */ 476ce7c7f2fSMark Adams if (pc_gamg->cpu_pin_coarse_grids) { 477ce7c7f2fSMark Adams #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 4788bca76a6SMark Adams static PetscInt llev = 2; 47963a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: Pinning level %" PetscInt_FMT " to the CPU\n", ((PetscObject)pc)->prefix, llev++)); 480ce7c7f2fSMark Adams #endif 4819566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*a_Amat_crs, PETSC_TRUE)); 4829566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*a_P_inout, PETSC_TRUE)); 483adf5291fSStefano Zampini if (1) { /* HACK: move this to MatBindCPU_MPIAIJXXX; lvec is created, need to pin it, this is done in MatSetUpMultiply_MPIAIJ. Hack */ 484ce7c7f2fSMark Adams Mat A = *a_Amat_crs, P = *a_P_inout; 485ce7c7f2fSMark Adams PetscMPIInt size; 4869566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size)); 487ce7c7f2fSMark Adams if (size > 1) { 488ce7c7f2fSMark Adams Mat_MPIAIJ *a = (Mat_MPIAIJ *)A->data, *p = (Mat_MPIAIJ *)P->data; 4899566063dSJacob Faibussowitsch PetscCall(VecBindToCPU(a->lvec, PETSC_TRUE)); 4909566063dSJacob Faibussowitsch PetscCall(VecBindToCPU(p->lvec, PETSC_TRUE)); 491ce7c7f2fSMark Adams } 492ce7c7f2fSMark Adams } 493ce7c7f2fSMark Adams } 494849bee69SMark Adams PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_REDUCE], 0, 0, 0, 0)); 495849bee69SMark Adams } // processor reduce 4963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4975b89ad90SMark F. Adams } 4985b89ad90SMark F. Adams 499bae903cbSmarkadams4 // used in GEO 500d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSquareGraph_GAMG(PC a_pc, Mat Gmat1, Mat *Gmat2) 501d71ae5a4SJacob Faibussowitsch { 5024b1575e2SStefano Zampini const char *prefix; 5034b1575e2SStefano Zampini char addp[32]; 5044b1575e2SStefano Zampini PC_MG *mg = (PC_MG *)a_pc->data; 5054b1575e2SStefano Zampini PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 5064b1575e2SStefano Zampini 5074b1575e2SStefano Zampini PetscFunctionBegin; 5089566063dSJacob Faibussowitsch PetscCall(PCGetOptionsPrefix(a_pc, &prefix)); 50963a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(a_pc, "%s: Square Graph on level %" PetscInt_FMT "\n", ((PetscObject)a_pc)->prefix, pc_gamg->current_level + 1)); 5109566063dSJacob Faibussowitsch PetscCall(MatProductCreate(Gmat1, Gmat1, NULL, Gmat2)); 5119566063dSJacob Faibussowitsch PetscCall(MatSetOptionsPrefix(*Gmat2, prefix)); 51263a3b9bcSJacob Faibussowitsch PetscCall(PetscSNPrintf(addp, sizeof(addp), "pc_gamg_square_%" PetscInt_FMT "_", pc_gamg->current_level)); 5139566063dSJacob Faibussowitsch PetscCall(MatAppendOptionsPrefix(*Gmat2, addp)); 514b94d7dedSBarry Smith if ((*Gmat2)->structurally_symmetric == PETSC_BOOL3_TRUE) { 5159566063dSJacob Faibussowitsch PetscCall(MatProductSetType(*Gmat2, MATPRODUCT_AB)); 516b4da3a1bSStefano Zampini } else { 5179566063dSJacob Faibussowitsch PetscCall(MatSetOption(Gmat1, MAT_FORM_EXPLICIT_TRANSPOSE, PETSC_TRUE)); 5189566063dSJacob Faibussowitsch PetscCall(MatProductSetType(*Gmat2, MATPRODUCT_AtB)); 519b4da3a1bSStefano Zampini } 5209566063dSJacob Faibussowitsch PetscCall(MatProductSetFromOptions(*Gmat2)); 5219566063dSJacob Faibussowitsch PetscCall(PetscLogEventBegin(petsc_gamg_setup_matmat_events[pc_gamg->current_level][0], 0, 0, 0, 0)); 5229566063dSJacob Faibussowitsch PetscCall(MatProductSymbolic(*Gmat2)); 5239566063dSJacob Faibussowitsch PetscCall(PetscLogEventEnd(petsc_gamg_setup_matmat_events[pc_gamg->current_level][0], 0, 0, 0, 0)); 5249566063dSJacob Faibussowitsch PetscCall(MatProductClear(*Gmat2)); 5254b1575e2SStefano Zampini /* we only need the sparsity, cheat and tell PETSc the matrix has been assembled */ 5264b1575e2SStefano Zampini (*Gmat2)->assembled = PETSC_TRUE; 5273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5284b1575e2SStefano Zampini } 5294b1575e2SStefano Zampini 5305b89ad90SMark F. Adams /* 5315b89ad90SMark F. Adams PCSetUp_GAMG - Prepares for the use of the GAMG preconditioner 5325b89ad90SMark F. Adams by setting data structures and options. 5335b89ad90SMark F. Adams 5345b89ad90SMark F. Adams Input Parameter: 5355b89ad90SMark F. Adams . pc - the preconditioner context 5365b89ad90SMark F. Adams 5375b89ad90SMark F. Adams */ 53866976f2fSJacob Faibussowitsch static PetscErrorCode PCSetUp_GAMG(PC pc) 539d71ae5a4SJacob Faibussowitsch { 5409d5b6da9SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 5415b89ad90SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 5422adcac29SMark F. Adams Mat Pmat = pc->pmat; 543b65aec2dSMark Adams PetscInt fine_level, level, level1, bs, M, N, qq, lidx, nASMBlocksArr[PETSC_MG_MAXLEVELS], cr_bs; 5443b4367a7SBarry Smith MPI_Comm comm; 545c5df96a5SBarry Smith PetscMPIInt rank, size, nactivepe; 54618c3aa7eSMark Mat Aarr[PETSC_MG_MAXLEVELS], Parr[PETSC_MG_MAXLEVELS]; 54718c3aa7eSMark IS *ASMLocalIDsArr[PETSC_MG_MAXLEVELS]; 5484279555eSSatish Balay PetscBool is_last = PETSC_FALSE; 5494279555eSSatish Balay #if defined(PETSC_USE_INFO) 550a2f3521dSMark F. Adams PetscLogDouble nnz0 = 0., nnztot = 0.; 551569f4572SMark Adams MatInfo info; 5524279555eSSatish Balay #endif 5535ef31b24SMark F. Adams 5545b89ad90SMark F. Adams PetscFunctionBegin; 5559566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm)); 5569566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &rank)); 5579566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 558849bee69SMark Adams PetscCall(PetscLogEventBegin(petsc_gamg_setup_events[GAMG_SETUP], 0, 0, 0, 0)); 5598abdc6daSStefano Zampini if (pc->setupcalled) { 5608abdc6daSStefano Zampini if (!pc_gamg->reuse_prol || pc->flag == DIFFERENT_NONZERO_PATTERN) { 561878e152fSMark F. Adams /* reset everything */ 5629566063dSJacob Faibussowitsch PetscCall(PCReset_MG(pc)); 563878e152fSMark F. Adams pc->setupcalled = 0; 564806fa848SBarry Smith } else { 56584d3f75bSMark F. Adams PC_MG_Levels **mglevels = mg->levels; 56603a628feSMark F. Adams /* just do Galerkin grids */ 56758471d46SMark F. Adams Mat B, dA, dB; 5689d5b6da9SMark F. Adams if (pc_gamg->Nlevels > 1) { 5694555aa8cSStefano Zampini PetscInt gl; 57058471d46SMark F. Adams /* currently only handle case where mat and pmat are the same on coarser levels */ 5719566063dSJacob Faibussowitsch PetscCall(KSPGetOperators(mglevels[pc_gamg->Nlevels - 1]->smoothd, &dA, &dB)); 57258471d46SMark F. Adams /* (re)set to get dirty flag */ 5739566063dSJacob Faibussowitsch PetscCall(KSPSetOperators(mglevels[pc_gamg->Nlevels - 1]->smoothd, dA, dB)); 57458471d46SMark F. Adams 5754555aa8cSStefano Zampini for (level = pc_gamg->Nlevels - 2, gl = 0; level >= 0; level--, gl++) { 5768abdc6daSStefano Zampini MatReuse reuse = MAT_INITIAL_MATRIX; 577849bee69SMark Adams #if defined(GAMG_STAGES) 578849bee69SMark Adams PetscCall(PetscLogStagePush(gamg_stages[gl])); 579849bee69SMark Adams #endif 5808abdc6daSStefano Zampini /* matrix structure can change from repartitioning or process reduction but don't know if we have process reduction here. Should fix */ 5819566063dSJacob Faibussowitsch PetscCall(KSPGetOperators(mglevels[level]->smoothd, NULL, &B)); 5828abdc6daSStefano Zampini if (B->product) { 583ad540459SPierre Jolivet if (B->product->A == dB && B->product->B == mglevels[level + 1]->interpolate) reuse = MAT_REUSE_MATRIX; 5848abdc6daSStefano Zampini } 5859566063dSJacob Faibussowitsch if (reuse == MAT_INITIAL_MATRIX) PetscCall(MatDestroy(&mglevels[level]->A)); 5868abdc6daSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 587e02fb3cdSMark Adams PetscCall(PetscInfo(pc, "%s: RAP after initial setup, reuse matrix level %" PetscInt_FMT "\n", ((PetscObject)pc)->prefix, level)); 5888abdc6daSStefano Zampini } else { 589e02fb3cdSMark Adams PetscCall(PetscInfo(pc, "%s: RAP after initial setup, with repartitioning (new matrix) level %" PetscInt_FMT "\n", ((PetscObject)pc)->prefix, level)); 5908abdc6daSStefano Zampini } 5919566063dSJacob Faibussowitsch PetscCall(PetscLogEventBegin(petsc_gamg_setup_matmat_events[gl][1], 0, 0, 0, 0)); 592fb842aefSJose E. Roman PetscCall(MatPtAP(dB, mglevels[level + 1]->interpolate, reuse, PETSC_DETERMINE, &B)); 5939566063dSJacob Faibussowitsch PetscCall(PetscLogEventEnd(petsc_gamg_setup_matmat_events[gl][1], 0, 0, 0, 0)); 59463b77682SMark Adams if (reuse == MAT_INITIAL_MATRIX) mglevels[level]->A = B; 5959566063dSJacob Faibussowitsch PetscCall(KSPSetOperators(mglevels[level]->smoothd, B, B)); 596e1cf1444SMark Adams // check for redoing eigen estimates 597e1cf1444SMark Adams if (pc_gamg->recompute_esteig) { 598e1cf1444SMark Adams PetscBool ischeb; 599e1cf1444SMark Adams KSP smoother; 600e1cf1444SMark Adams PetscCall(PCMGGetSmoother(pc, level + 1, &smoother)); 601e1cf1444SMark Adams PetscCall(PetscObjectTypeCompare((PetscObject)smoother, KSPCHEBYSHEV, &ischeb)); 602e1cf1444SMark Adams if (ischeb) { 603e1cf1444SMark Adams KSP_Chebyshev *cheb = (KSP_Chebyshev *)smoother->data; 604e1cf1444SMark Adams cheb->emin_provided = 0; 605e1cf1444SMark Adams cheb->emax_provided = 0; 606e1cf1444SMark Adams } 607e1cf1444SMark Adams /* we could call PetscCall(KSPChebyshevSetEigenvalues(smoother, 0, 0)); but the logic does not work properly */ 608e1cf1444SMark Adams } 609e1cf1444SMark Adams // inc 61058471d46SMark F. Adams dB = B; 611849bee69SMark Adams #if defined(GAMG_STAGES) 612849bee69SMark Adams PetscCall(PetscLogStagePop()); 613849bee69SMark Adams #endif 61458471d46SMark F. Adams } 6155f8cf99dSMark F. Adams } 616d5280255SMark F. Adams 6179566063dSJacob Faibussowitsch PetscCall(PCSetUp_MG(pc)); 618849bee69SMark Adams PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_SETUP], 0, 0, 0, 0)); 6193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 620eb07cef2SMark F. Adams } 621878e152fSMark F. Adams } 622f6536408SMark F. Adams 623878e152fSMark F. Adams if (!pc_gamg->data) { 624878e152fSMark F. Adams if (pc_gamg->orig_data) { 6259566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(Pmat, &bs)); 6269566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(Pmat, &qq, NULL)); 6272fa5cd67SKarl Rupp 628878e152fSMark F. Adams pc_gamg->data_sz = (qq / bs) * pc_gamg->orig_data_cell_rows * pc_gamg->orig_data_cell_cols; 629878e152fSMark F. Adams pc_gamg->data_cell_rows = pc_gamg->orig_data_cell_rows; 630878e152fSMark F. Adams pc_gamg->data_cell_cols = pc_gamg->orig_data_cell_cols; 6312fa5cd67SKarl Rupp 6329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(pc_gamg->data_sz, &pc_gamg->data)); 633878e152fSMark F. Adams for (qq = 0; qq < pc_gamg->data_sz; qq++) pc_gamg->data[qq] = pc_gamg->orig_data[qq]; 634806fa848SBarry Smith } else { 6355f80ce2aSJacob Faibussowitsch PetscCheck(pc_gamg->ops->createdefaultdata, comm, PETSC_ERR_PLIB, "'createdefaultdata' not set(?) need to support NULL data"); 6369566063dSJacob Faibussowitsch PetscCall(pc_gamg->ops->createdefaultdata(pc, Pmat)); 6379d5b6da9SMark F. Adams } 638878e152fSMark F. Adams } 639878e152fSMark F. Adams 640878e152fSMark F. Adams /* cache original data for reuse */ 6411c1aac46SBarry Smith if (!pc_gamg->orig_data && (PetscBool)(!pc_gamg->reuse_prol)) { 6429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(pc_gamg->data_sz, &pc_gamg->orig_data)); 643878e152fSMark F. Adams for (qq = 0; qq < pc_gamg->data_sz; qq++) pc_gamg->orig_data[qq] = pc_gamg->data[qq]; 644878e152fSMark F. Adams pc_gamg->orig_data_cell_rows = pc_gamg->data_cell_rows; 645878e152fSMark F. Adams pc_gamg->orig_data_cell_cols = pc_gamg->data_cell_cols; 646878e152fSMark F. Adams } 647038e3b61SMark F. Adams 648302f38e8SMark F. Adams /* get basic dims */ 6499566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(Pmat, &bs)); 650b65aec2dSMark Adams PetscCall(MatGetSize(Pmat, &M, NULL)); 65184d3f75bSMark F. Adams 6524279555eSSatish Balay #if defined(PETSC_USE_INFO) 6539566063dSJacob Faibussowitsch PetscCall(MatGetInfo(Pmat, MAT_GLOBAL_SUM, &info)); /* global reduction */ 654569f4572SMark Adams nnz0 = info.nz_used; 655569f4572SMark Adams nnztot = info.nz_used; 6564279555eSSatish Balay #endif 657b65aec2dSMark Adams PetscCall(PetscInfo(pc, "%s: level %d) N=%" PetscInt_FMT ", n data rows=%" PetscInt_FMT ", n data cols=%" PetscInt_FMT ", nnz/row (ave)=%" PetscInt_FMT ", block size %d, np=%d\n", ((PetscObject)pc)->prefix, 0, M, pc_gamg->data_cell_rows, pc_gamg->data_cell_cols, (PetscInt)(nnz0 / (PetscReal)M + 0.5), (int)bs, size)); 658569f4572SMark Adams 659a2f3521dSMark F. Adams /* Get A_i and R_i */ 660b65aec2dSMark Adams for (level = 0, Aarr[0] = Pmat, nactivepe = size; level < (pc_gamg->Nlevels - 1) && (level == 0 || M > pc_gamg->coarse_eq_limit); level++) { 6619ab59c8bSMark Adams pc_gamg->current_level = level; 6625b89ad90SMark F. Adams level1 = level + 1; 6634555aa8cSStefano Zampini #if defined(GAMG_STAGES) 664849bee69SMark Adams if (!gamg_stages[level]) { 665849bee69SMark Adams char str[32]; 666a364092eSJacob Faibussowitsch PetscCall(PetscSNPrintf(str, PETSC_STATIC_ARRAY_LENGTH(str), "GAMG Level %d", (int)level)); 667849bee69SMark Adams PetscCall(PetscLogStageRegister(str, &gamg_stages[level])); 668849bee69SMark Adams } 6699566063dSJacob Faibussowitsch PetscCall(PetscLogStagePush(gamg_stages[level])); 670b4fbaa2aSMark F. Adams #endif 671b65aec2dSMark Adams /* construct prolongator - Parr[level1] */ 672b65aec2dSMark Adams if (level == 0 && pc_gamg->injection_index_size > 0) { 673b65aec2dSMark Adams Mat Prol; 674b65aec2dSMark Adams MatType mtype; 675b65aec2dSMark Adams PetscInt prol_m, prol_n, Prol_N = (M / bs) * pc_gamg->injection_index_size, Istart, Iend, nn, row; 676b65aec2dSMark Adams PetscCall(PetscInfo(pc, "Create fine grid injection space prolongation %" PetscInt_FMT " x %" PetscInt_FMT ". %s\n", M, Prol_N, pc_gamg->data ? "delete null space data" : "")); 677b65aec2dSMark Adams PetscCall(MatGetOwnershipRange(Pmat, &Istart, &Iend)); 678b65aec2dSMark Adams PetscCall(MatGetLocalSize(Pmat, &prol_m, NULL)); // rows m x n 679b65aec2dSMark Adams prol_n = (prol_m / bs) * pc_gamg->injection_index_size; 680b65aec2dSMark Adams PetscCheck(pc_gamg->injection_index_size < bs, PetscObjectComm((PetscObject)pc), PETSC_ERR_ARG_INCOMP, "Injection size %d must be less that block size %d", (int)pc_gamg->injection_index_size, (int)bs); 681b65aec2dSMark Adams PetscCall(MatGetType(Pmat, &mtype)); 682b65aec2dSMark Adams PetscCall(MatCreate(PetscObjectComm((PetscObject)pc), &Prol)); 683b65aec2dSMark Adams PetscCall(MatSetBlockSizes(Prol, bs, pc_gamg->injection_index_size)); 684b65aec2dSMark Adams PetscCall(MatSetSizes(Prol, prol_m, prol_n, M, Prol_N)); 685b65aec2dSMark Adams PetscCall(MatSetType(Prol, mtype)); 686b65aec2dSMark Adams #if PetscDefined(HAVE_DEVICE) 687b65aec2dSMark Adams PetscBool flg; 688b65aec2dSMark Adams PetscCall(MatBoundToCPU(Pmat, &flg)); 689b65aec2dSMark Adams PetscCall(MatBindToCPU(Prol, flg)); 690b65aec2dSMark Adams if (flg) PetscCall(MatSetBindingPropagates(Prol, PETSC_TRUE)); 691b65aec2dSMark Adams #endif 692b65aec2dSMark Adams PetscCall(MatSeqAIJSetPreallocation(Prol, 1, NULL)); 693b65aec2dSMark Adams PetscCall(MatMPIAIJSetPreallocation(Prol, 1, NULL, 0, NULL)); 694b65aec2dSMark Adams // set I \kron [1, 1, ... ]^T 695b65aec2dSMark Adams for (PetscInt ii = Istart, col = (Istart / bs) * pc_gamg->injection_index_size; ii < Iend; ii += bs) { 696b65aec2dSMark Adams const PetscScalar one = 1; 697b65aec2dSMark Adams for (PetscInt jj = 0; jj < pc_gamg->injection_index_size; jj++, col++) { 698b65aec2dSMark Adams PetscInt row = ii + pc_gamg->injection_index[jj]; 699b65aec2dSMark Adams PetscCall(MatSetValues(Prol, 1, &row, 1, &col, &one, INSERT_VALUES)); 700b65aec2dSMark Adams } 701b65aec2dSMark Adams } 702b65aec2dSMark Adams PetscCall(MatAssemblyBegin(Prol, MAT_FINAL_ASSEMBLY)); 703b65aec2dSMark Adams PetscCall(MatAssemblyEnd(Prol, MAT_FINAL_ASSEMBLY)); 704b65aec2dSMark Adams PetscCall(MatViewFromOptions(Prol, NULL, "-mat_view_injection")); 705b65aec2dSMark Adams PetscCall(MatGetBlockSizes(Prol, NULL, &cr_bs)); // column size 706b65aec2dSMark Adams Parr[level1] = Prol; 707b65aec2dSMark Adams // can not deal with null space -- with array of 'injection cols' we could take 'injection rows and 'injection cols' to 'data' 708b65aec2dSMark Adams if (pc_gamg->data) { 709b65aec2dSMark Adams pc_gamg->data_cell_cols = pc_gamg->injection_index_size; 710b65aec2dSMark Adams pc_gamg->data_cell_rows = pc_gamg->injection_index_size; 711b65aec2dSMark Adams pc_gamg->orig_data_cell_cols = 0; 712b65aec2dSMark Adams pc_gamg->orig_data_cell_rows = 0; 713b65aec2dSMark Adams PetscCall(PetscFree(pc_gamg->data)); 714b65aec2dSMark Adams pc_gamg->data_sz = pc_gamg->injection_index_size * prol_n; 715b65aec2dSMark Adams PetscCall(PetscMalloc1(pc_gamg->data_sz, &pc_gamg->data)); 716b65aec2dSMark Adams for (row = nn = 0; row < prol_n; row += pc_gamg->injection_index_size) { 717b65aec2dSMark Adams for (int jj = 0; jj < pc_gamg->injection_index_size; jj++) { 718b65aec2dSMark Adams int idx = row * pc_gamg->injection_index_size + jj * pc_gamg->injection_index_size; 719b65aec2dSMark Adams for (int kk = 0; kk < pc_gamg->injection_index_size; kk++, nn++) { pc_gamg->data[idx + kk] = (jj == kk) ? 1 : 0; } 720b65aec2dSMark Adams } 721b65aec2dSMark Adams } 722b65aec2dSMark Adams PetscCheck(nn == pc_gamg->data_sz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "nn != pc_gamg->data_sz %" PetscInt_FMT " %" PetscInt_FMT, pc_gamg->data_sz, nn); 723b65aec2dSMark Adams } 724b65aec2dSMark Adams } else { 7258926f930SMark Adams Mat Gmat, mat; 7260cbbd2e1SMark F. Adams PetscCoarsenData *agg_lists; 7277700e67bSMark Adams Mat Prol11; 728c8b0795cSMark F. Adams 7292d776b49SBarry Smith PetscCall(PCGAMGCreateGraph(pc, Aarr[level], &Gmat)); 7309c15c1aeSMark Adams PetscCall(pc_gamg->ops->coarsen(pc, &Gmat, &agg_lists)); // Gmat may have ghosts for QR aggregates not in matrix 7318926f930SMark Adams PetscCall(PetscCDGetMat(agg_lists, &mat)); 7328926f930SMark Adams if (!mat) PetscCall(PetscCDSetMat(agg_lists, Gmat)); 7338926f930SMark Adams PetscCall(pc_gamg->ops->prolongator(pc, Aarr[level], agg_lists, &Prol11)); 734a2f3521dSMark F. Adams /* could have failed to create new level */ 735a2f3521dSMark F. Adams if (Prol11) { 736f7df55f0SStefano Zampini const char *prefix; 737f7df55f0SStefano Zampini char addp[32]; 738f7df55f0SStefano Zampini 7399d5b6da9SMark F. Adams /* get new block size of coarse matrices */ 740b65aec2dSMark Adams PetscCall(MatGetBlockSizes(Prol11, NULL, &cr_bs)); // column size 741a2f3521dSMark F. Adams 742fd1112cbSBarry Smith if (pc_gamg->ops->optprolongator) { 743c8b0795cSMark F. Adams /* smooth */ 7449566063dSJacob Faibussowitsch PetscCall(pc_gamg->ops->optprolongator(pc, Aarr[level], &Prol11)); 745c8b0795cSMark F. Adams } 746c8b0795cSMark F. Adams 7470c3bc534SBarry Smith if (pc_gamg->use_aggs_in_asm) { 7488926f930SMark Adams PetscInt bs; 7498926f930SMark Adams PetscCall(MatGetBlockSizes(Prol11, &bs, NULL)); // row block size 7509c15c1aeSMark Adams PetscCall(PetscCDGetASMBlocks(agg_lists, bs, &nASMBlocksArr[level], &ASMLocalIDsArr[level])); 7519c15c1aeSMark Adams PetscCall(PetscInfo(pc, "%d: %" PetscInt_FMT " ASM local domains, bs = %d\n", (int)level, nASMBlocksArr[level], (int)bs)); 7528926f930SMark Adams } else if (pc_gamg->asm_hem_aggs) { 7538926f930SMark Adams const char *prefix; 7548926f930SMark Adams PetscInt bs; 755e0b7e82fSBarry Smith 756e0b7e82fSBarry Smith /* 757e0b7e82fSBarry Smith Do not use aggs created for defining coarser problems, instead create aggs specifically to use 758e0b7e82fSBarry Smith to define PCASM blocks. 759e0b7e82fSBarry Smith */ 7608926f930SMark Adams PetscCall(PetscCDGetMat(agg_lists, &mat)); 7618926f930SMark Adams if (mat == Gmat) PetscCall(PetscCDClearMat(agg_lists)); // take the Mat away from the list (yuck) 7628926f930SMark Adams PetscCall(PetscCDDestroy(agg_lists)); 7638926f930SMark Adams PetscCall(PetscInfo(pc, "HEM ASM passes = %d\n", (int)pc_gamg->asm_hem_aggs)); 764e0b7e82fSBarry Smith PetscCall(MatCoarsenDestroy(&pc_gamg->asm_crs)); 765e0b7e82fSBarry Smith PetscCall(MatCoarsenCreate(PetscObjectComm((PetscObject)pc), &pc_gamg->asm_crs)); 7668926f930SMark Adams PetscCall(PetscObjectGetOptionsPrefix((PetscObject)pc, &prefix)); 767e0b7e82fSBarry Smith PetscCall(PetscObjectSetOptionsPrefix((PetscObject)pc_gamg->asm_crs, prefix)); 768e0b7e82fSBarry Smith PetscCall(MatCoarsenSetFromOptions(pc_gamg->asm_crs)); // get strength args 769e0b7e82fSBarry Smith PetscCall(MatCoarsenSetType(pc_gamg->asm_crs, MATCOARSENHEM)); 770e0b7e82fSBarry Smith PetscCall(MatCoarsenSetMaximumIterations(pc_gamg->asm_crs, pc_gamg->asm_hem_aggs)); 771e0b7e82fSBarry Smith PetscCall(MatCoarsenSetAdjacency(pc_gamg->asm_crs, Gmat)); 772e0b7e82fSBarry Smith PetscCall(MatCoarsenSetStrictAggs(pc_gamg->asm_crs, PETSC_TRUE)); 773e0b7e82fSBarry Smith PetscCall(MatCoarsenApply(pc_gamg->asm_crs)); 774e0b7e82fSBarry Smith PetscCall(MatCoarsenGetData(pc_gamg->asm_crs, &agg_lists)); /* output */ 7758926f930SMark Adams // create aggregates 7768926f930SMark Adams PetscCall(MatGetBlockSizes(Aarr[level], &bs, NULL)); // row block size 7778926f930SMark Adams PetscCall(PetscCDGetASMBlocks(agg_lists, bs, &nASMBlocksArr[level], &ASMLocalIDsArr[level])); 778ffc955d6SMark F. Adams } 7799566063dSJacob Faibussowitsch PetscCall(PCGetOptionsPrefix(pc, &prefix)); 7809566063dSJacob Faibussowitsch PetscCall(MatSetOptionsPrefix(Prol11, prefix)); 7819566063dSJacob Faibussowitsch PetscCall(PetscSNPrintf(addp, sizeof(addp), "pc_gamg_prolongator_%d_", (int)level)); 7829566063dSJacob Faibussowitsch PetscCall(MatAppendOptionsPrefix(Prol11, addp)); 78391f31d3dSStefano Zampini /* Always generate the transpose with CUDA 784f7df55f0SStefano Zampini Such behaviour can be adapted with -pc_gamg_prolongator_ prefixed options */ 7859566063dSJacob Faibussowitsch PetscCall(MatSetOption(Prol11, MAT_FORM_EXPLICIT_TRANSPOSE, PETSC_TRUE)); 7869566063dSJacob Faibussowitsch PetscCall(MatSetFromOptions(Prol11)); 7874bde40a0SMark Adams Parr[level1] = Prol11; 7884bde40a0SMark Adams } else Parr[level1] = NULL; /* failed to coarsen */ 7898926f930SMark Adams PetscCall(PetscCDGetMat(agg_lists, &mat)); 7908926f930SMark Adams if (mat == Gmat) PetscCall(PetscCDClearMat(agg_lists)); // take the Mat away from the list (yuck) 7919566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Gmat)); 7929566063dSJacob Faibussowitsch PetscCall(PetscCDDestroy(agg_lists)); 793a2f3521dSMark F. Adams } /* construct prolongator scope */ 794b65aec2dSMark Adams if (level == 0) Aarr[0] = Pmat; /* use Pmat for finest level setup */ 795171cca9aSMark Adams if (!Parr[level1]) { /* failed to coarsen */ 79663a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: Stop gridding, level %" PetscInt_FMT "\n", ((PetscObject)pc)->prefix, level)); 7974555aa8cSStefano Zampini #if defined(GAMG_STAGES) 7989566063dSJacob Faibussowitsch PetscCall(PetscLogStagePop()); 799a90e85d9SMark Adams #endif 800c8b0795cSMark F. Adams break; 801c8b0795cSMark F. Adams } 8029566063dSJacob Faibussowitsch PetscCall(MatGetSize(Parr[level1], &M, &N)); /* N is next M, a loop test variables */ 8032472a847SBarry Smith PetscCheck(!is_last, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Is last ?"); 804171cca9aSMark Adams if (N <= pc_gamg->coarse_eq_limit) is_last = PETSC_TRUE; 8050e2909e1SMark Adams if (level1 == pc_gamg->Nlevels - 1) is_last = PETSC_TRUE; 806e323ae0aSPierre Jolivet if (level == PETSC_MG_MAXLEVELS - 2) is_last = PETSC_TRUE; 807849bee69SMark Adams PetscCall(PetscLogEventBegin(petsc_gamg_setup_events[GAMG_LEVEL], 0, 0, 0, 0)); 808b65aec2dSMark Adams PetscCall(pc_gamg->ops->createlevel(pc, Aarr[level], cr_bs, &Parr[level1], &Aarr[level1], &nactivepe, NULL, is_last)); 809849bee69SMark Adams PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_LEVEL], 0, 0, 0, 0)); 810a2f3521dSMark F. Adams 8119566063dSJacob Faibussowitsch PetscCall(MatGetSize(Aarr[level1], &M, &N)); /* M is loop test variables */ 8124279555eSSatish Balay #if defined(PETSC_USE_INFO) 8139566063dSJacob Faibussowitsch PetscCall(MatGetInfo(Aarr[level1], MAT_GLOBAL_SUM, &info)); 814569f4572SMark Adams nnztot += info.nz_used; 8154279555eSSatish Balay #endif 816bae903cbSmarkadams4 PetscCall(PetscInfo(pc, "%s: %d) N=%" PetscInt_FMT ", n data cols=%" PetscInt_FMT ", nnz/row (ave)=%" PetscInt_FMT ", %d active pes\n", ((PetscObject)pc)->prefix, (int)level1, M, pc_gamg->data_cell_cols, (PetscInt)(info.nz_used / (PetscReal)M), nactivepe)); 817569f4572SMark Adams 8184555aa8cSStefano Zampini #if defined(GAMG_STAGES) 8199566063dSJacob Faibussowitsch PetscCall(PetscLogStagePop()); 820b4fbaa2aSMark F. Adams #endif 821a90e85d9SMark Adams /* stop if one node or one proc -- could pull back for singular problems */ 8229ab59c8bSMark Adams if ((pc_gamg->data_cell_cols && M / pc_gamg->data_cell_cols < 2) || (!pc_gamg->data_cell_cols && M / bs < 2)) { 82363a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: HARD stop of coarsening on level %" PetscInt_FMT ". Grid too small: %" PetscInt_FMT " block nodes\n", ((PetscObject)pc)->prefix, level, M / bs)); 824a90e85d9SMark Adams level++; 825a90e85d9SMark Adams break; 826e323ae0aSPierre Jolivet } else if (level == PETSC_MG_MAXLEVELS - 2) { /* stop if we are limited by PC_MG_MAXLEVELS */ 827e323ae0aSPierre Jolivet PetscCall(PetscInfo(pc, "%s: HARD stop of coarsening on level %" PetscInt_FMT ". PC_MG_MAXLEVELS reached\n", ((PetscObject)pc)->prefix, level)); 828e323ae0aSPierre Jolivet level++; 829e323ae0aSPierre Jolivet break; 830a90e85d9SMark Adams } 831c8b0795cSMark F. Adams } /* levels */ 8329566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg->data)); 833c8b0795cSMark F. Adams 834ba4ceb06Smarkadams4 PetscCall(PetscInfo(pc, "%s: %" PetscInt_FMT " levels, operator complexity = %g\n", ((PetscObject)pc)->prefix, level + 1, nnztot / nnz0)); 8359d5b6da9SMark F. Adams pc_gamg->Nlevels = level + 1; 8365b89ad90SMark F. Adams fine_level = level; 8379566063dSJacob Faibussowitsch PetscCall(PCMGSetLevels(pc, pc_gamg->Nlevels, NULL)); 8385b89ad90SMark F. Adams 83962294041SBarry Smith if (pc_gamg->Nlevels > 1) { /* don't setup MG if one level */ 8400ed2132dSStefano Zampini 841d5280255SMark F. Adams /* set default smoothers & set operators */ 84262294041SBarry Smith for (lidx = 1, level = pc_gamg->Nlevels - 2; lidx <= fine_level; lidx++, level--) { 843ffc955d6SMark F. Adams KSP smoother; 844ffc955d6SMark F. Adams PC subpc; 845a2f3521dSMark F. Adams 8469566063dSJacob Faibussowitsch PetscCall(PCMGGetSmoother(pc, lidx, &smoother)); 8479566063dSJacob Faibussowitsch PetscCall(KSPGetPC(smoother, &subpc)); 848ffc955d6SMark F. Adams 8499566063dSJacob Faibussowitsch PetscCall(KSPSetNormType(smoother, KSP_NORM_NONE)); 850a2f3521dSMark F. Adams /* set ops */ 8519566063dSJacob Faibussowitsch PetscCall(KSPSetOperators(smoother, Aarr[level], Aarr[level])); 8529566063dSJacob Faibussowitsch PetscCall(PCMGSetInterpolation(pc, lidx, Parr[level + 1])); 853a2f3521dSMark F. Adams 854a2f3521dSMark F. Adams /* set defaults */ 8559566063dSJacob Faibussowitsch PetscCall(KSPSetType(smoother, KSPCHEBYSHEV)); 856a2f3521dSMark F. Adams 8570c3bc534SBarry Smith /* set blocks for ASM smoother that uses the 'aggregates' */ 8588926f930SMark Adams if (pc_gamg->use_aggs_in_asm || pc_gamg->asm_hem_aggs) { 8592d3561bbSSatish Balay PetscInt sz; 8607a28f3e5SMark Adams IS *iss; 861a2f3521dSMark F. Adams 8622d3561bbSSatish Balay sz = nASMBlocksArr[level]; 8637a28f3e5SMark Adams iss = ASMLocalIDsArr[level]; 8649566063dSJacob Faibussowitsch PetscCall(PCSetType(subpc, PCASM)); 8659566063dSJacob Faibussowitsch PetscCall(PCASMSetOverlap(subpc, 0)); 8669566063dSJacob Faibussowitsch PetscCall(PCASMSetType(subpc, PC_ASM_BASIC)); 8677f66b68fSMark Adams if (!sz) { 868ffc955d6SMark F. Adams IS is; 8699566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, 0, NULL, PETSC_COPY_VALUES, &is)); 8709566063dSJacob Faibussowitsch PetscCall(PCASMSetLocalSubdomains(subpc, 1, NULL, &is)); 8719566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is)); 872806fa848SBarry Smith } else { 873a94c3b12SMark F. Adams PetscInt kk; 8742eab5cd7Smarkadams4 PetscCall(PCASMSetLocalSubdomains(subpc, sz, iss, NULL)); 87548a46eb9SPierre Jolivet for (kk = 0; kk < sz; kk++) PetscCall(ISDestroy(&iss[kk])); 8769566063dSJacob Faibussowitsch PetscCall(PetscFree(iss)); 877ffc955d6SMark F. Adams } 8780298fd71SBarry Smith ASMLocalIDsArr[level] = NULL; 879ffc955d6SMark F. Adams nASMBlocksArr[level] = 0; 880806fa848SBarry Smith } else { 8819566063dSJacob Faibussowitsch PetscCall(PCSetType(subpc, PCJACOBI)); 882ffc955d6SMark F. Adams } 883d5280255SMark F. Adams } 884d5280255SMark F. Adams { 885d5280255SMark F. Adams /* coarse grid */ 8869371c9d4SSatish Balay KSP smoother, *k2; 8879371c9d4SSatish Balay PC subpc, pc2; 8889371c9d4SSatish Balay PetscInt ii, first; 8899371c9d4SSatish Balay Mat Lmat = Aarr[(level = pc_gamg->Nlevels - 1)]; 8909371c9d4SSatish Balay lidx = 0; 8910ed2132dSStefano Zampini 8929566063dSJacob Faibussowitsch PetscCall(PCMGGetSmoother(pc, lidx, &smoother)); 8939566063dSJacob Faibussowitsch PetscCall(KSPSetOperators(smoother, Lmat, Lmat)); 894cf8ae1d3SMark Adams if (!pc_gamg->use_parallel_coarse_grid_solver) { 8959566063dSJacob Faibussowitsch PetscCall(KSPSetNormType(smoother, KSP_NORM_NONE)); 8969566063dSJacob Faibussowitsch PetscCall(KSPGetPC(smoother, &subpc)); 8979566063dSJacob Faibussowitsch PetscCall(PCSetType(subpc, PCBJACOBI)); 8989566063dSJacob Faibussowitsch PetscCall(PCSetUp(subpc)); 8999566063dSJacob Faibussowitsch PetscCall(PCBJacobiGetSubKSP(subpc, &ii, &first, &k2)); 90063a3b9bcSJacob Faibussowitsch PetscCheck(ii == 1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "ii %" PetscInt_FMT " is not one", ii); 9019566063dSJacob Faibussowitsch PetscCall(KSPGetPC(k2[0], &pc2)); 9029566063dSJacob Faibussowitsch PetscCall(PCSetType(pc2, PCLU)); 9039566063dSJacob Faibussowitsch PetscCall(PCFactorSetShiftType(pc2, MAT_SHIFT_INBLOCKS)); 904fb842aefSJose E. Roman PetscCall(KSPSetTolerances(k2[0], PETSC_CURRENT, PETSC_CURRENT, PETSC_CURRENT, 1)); 9059566063dSJacob Faibussowitsch PetscCall(KSPSetType(k2[0], KSPPREONLY)); 906d5280255SMark F. Adams } 907cf8ae1d3SMark Adams } 908d5280255SMark F. Adams 909d5280255SMark F. Adams /* should be called in PCSetFromOptions_GAMG(), but cannot be called prior to PCMGSetLevels() */ 910d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)pc); 911dbbe0bcdSBarry Smith PetscCall(PCSetFromOptions_MG(pc, PetscOptionsObject)); 912d0609cedSBarry Smith PetscOptionsEnd(); 9139566063dSJacob Faibussowitsch PetscCall(PCMGSetGalerkin(pc, PC_MG_GALERKIN_EXTERNAL)); 914d5280255SMark F. Adams 915f1580f4eSBarry Smith /* set cheby eigen estimates from SA to use in the solver */ 9167e6512fdSJed Brown if (pc_gamg->use_sa_esteig) { 91718c3aa7eSMark for (lidx = 1, level = pc_gamg->Nlevels - 2; level >= 0; lidx++, level--) { 91818c3aa7eSMark KSP smoother; 91918c3aa7eSMark PetscBool ischeb; 9200ed2132dSStefano Zampini 9219566063dSJacob Faibussowitsch PetscCall(PCMGGetSmoother(pc, lidx, &smoother)); 9229566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)smoother, KSPCHEBYSHEV, &ischeb)); 92318c3aa7eSMark if (ischeb) { 92418c3aa7eSMark KSP_Chebyshev *cheb = (KSP_Chebyshev *)smoother->data; 9250ed2132dSStefano Zampini 9262de708cbSJed Brown // The command line will override these settings because KSPSetFromOptions is called in PCSetUp_MG 927efe053fcSJed Brown if (mg->max_eigen_DinvA[level] > 0) { 9287e6512fdSJed Brown // SA uses Jacobi for P; we use SA estimates if the smoother is also Jacobi or if the user explicitly requested it. 9297e6512fdSJed Brown // TODO: This should test whether it's the same Jacobi variant (DIAG, ROWSUM, etc.) 93018c3aa7eSMark PetscReal emax, emin; 9310ed2132dSStefano Zampini 93218c3aa7eSMark emin = mg->min_eigen_DinvA[level]; 93318c3aa7eSMark emax = mg->max_eigen_DinvA[level]; 93463a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: PCSetUp_GAMG: call KSPChebyshevSetEigenvalues on level %" PetscInt_FMT " (N=%" PetscInt_FMT ") with emax = %g emin = %g\n", ((PetscObject)pc)->prefix, level, Aarr[level]->rmap->N, (double)emax, (double)emin)); 9350a94a983SJed Brown cheb->emin_provided = emin; 9360a94a983SJed Brown cheb->emax_provided = emax; 93718c3aa7eSMark } 93818c3aa7eSMark } 93918c3aa7eSMark } 94018c3aa7eSMark } 9410ed2132dSStefano Zampini 9429566063dSJacob Faibussowitsch PetscCall(PCSetUp_MG(pc)); 9430ed2132dSStefano Zampini 944d5280255SMark F. Adams /* clean up */ 945d5280255SMark F. Adams for (level = 1; level < pc_gamg->Nlevels; level++) { 9469566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Parr[level])); 9479566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Aarr[level])); 9485b89ad90SMark F. Adams } 949806fa848SBarry Smith } else { 9505f8cf99dSMark F. Adams KSP smoother; 9510ed2132dSStefano Zampini 95263a3b9bcSJacob Faibussowitsch PetscCall(PetscInfo(pc, "%s: One level solver used (system is seen as DD). Using default solver.\n", ((PetscObject)pc)->prefix)); 9539566063dSJacob Faibussowitsch PetscCall(PCMGGetSmoother(pc, 0, &smoother)); 9549566063dSJacob Faibussowitsch PetscCall(KSPSetOperators(smoother, Aarr[0], Aarr[0])); 9559566063dSJacob Faibussowitsch PetscCall(KSPSetType(smoother, KSPPREONLY)); 9569566063dSJacob Faibussowitsch PetscCall(PCSetUp_MG(pc)); 9575f8cf99dSMark F. Adams } 958849bee69SMark Adams PetscCall(PetscLogEventEnd(petsc_gamg_setup_events[GAMG_SETUP], 0, 0, 0, 0)); 9593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9605b89ad90SMark F. Adams } 9615b89ad90SMark F. Adams 9625b89ad90SMark F. Adams /* 9635b89ad90SMark F. Adams PCDestroy_GAMG - Destroys the private context for the GAMG preconditioner 9645b89ad90SMark F. Adams that was created with PCCreate_GAMG(). 9655b89ad90SMark F. Adams 9665b89ad90SMark F. Adams Input Parameter: 9675b89ad90SMark F. Adams . pc - the preconditioner context 9685b89ad90SMark F. Adams 9695b89ad90SMark F. Adams Application Interface Routine: PCDestroy() 9705b89ad90SMark F. Adams */ 971d71ae5a4SJacob Faibussowitsch PetscErrorCode PCDestroy_GAMG(PC pc) 972d71ae5a4SJacob Faibussowitsch { 9735b89ad90SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 9745b89ad90SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 9755b89ad90SMark F. Adams 9765b89ad90SMark F. Adams PetscFunctionBegin; 9779566063dSJacob Faibussowitsch PetscCall(PCReset_GAMG(pc)); 9781baa6e33SBarry Smith if (pc_gamg->ops->destroy) PetscCall((*pc_gamg->ops->destroy)(pc)); 9799566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg->ops)); 9809566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg->gamg_type_name)); 9819566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg)); 9822e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetProcEqLim_C", NULL)); 9832e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetCoarseEqLim_C", NULL)); 9842e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetRepartition_C", NULL)); 9852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetEigenvalues_C", NULL)); 9862e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetUseSAEstEig_C", NULL)); 987e1cf1444SMark Adams PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetRecomputeEstEig_C", NULL)); 9882e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetReuseInterpolation_C", NULL)); 9892e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGASMSetUseAggs_C", NULL)); 990d529f056Smarkadams4 PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetParallelCoarseGridSolve_C", NULL)); 9912e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetCpuPinCoarseGrids_C", NULL)); 9922e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetCoarseGridLayoutType_C", NULL)); 9932e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetThreshold_C", NULL)); 9942e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetRankReductionFactors_C", NULL)); 9952e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetThresholdScale_C", NULL)); 9962e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetType_C", NULL)); 9972e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGGetType_C", NULL)); 9982e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetNlevels_C", NULL)); 9998926f930SMark Adams PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGASMSetHEM_C", NULL)); 1000b65aec2dSMark Adams PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetInjectionIndices_C", NULL)); 1001b65aec2dSMark Adams PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetInjectionIndex_C", NULL)); 10029566063dSJacob Faibussowitsch PetscCall(PCDestroy_MG(pc)); 10033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10045b89ad90SMark F. Adams } 10055b89ad90SMark F. Adams 1006676e1743SMark F. Adams /*@ 1007f1580f4eSBarry Smith PCGAMGSetProcEqLim - Set number of equations to aim for per process on the coarse grids via processor reduction in `PCGAMG` 1008676e1743SMark F. Adams 1009c3339decSBarry Smith Logically Collective 1010676e1743SMark F. Adams 1011676e1743SMark F. Adams Input Parameters: 10121cc46a46SBarry Smith + pc - the preconditioner context 10131cc46a46SBarry Smith - n - the number of equations 1014676e1743SMark F. Adams 1015676e1743SMark F. Adams Options Database Key: 1016147403d9SBarry Smith . -pc_gamg_process_eq_limit <limit> - set the limit 1017676e1743SMark F. Adams 101820f4b53cSBarry Smith Level: intermediate 101920f4b53cSBarry Smith 1020f1580f4eSBarry Smith Note: 1021f1580f4eSBarry Smith `PCGAMG` will reduce the number of MPI processes used directly on the coarse grids so that there are around <limit> equations on each process 1022cab9ed1eSBarry Smith that has degrees of freedom 1023cab9ed1eSBarry Smith 1024a077d33dSBarry Smith Developer Note: 1025a077d33dSBarry Smith Should be named `PCGAMGSetProcessEquationLimit()`. 1026a077d33dSBarry Smith 1027a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetCoarseEqLim()`, `PCGAMGSetRankReductionFactors()`, `PCGAMGSetRepartition()` 1028676e1743SMark F. Adams @*/ 1029d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetProcEqLim(PC pc, PetscInt n) 1030d71ae5a4SJacob Faibussowitsch { 1031676e1743SMark F. Adams PetscFunctionBegin; 1032676e1743SMark F. Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1033cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetProcEqLim_C", (PC, PetscInt), (pc, n)); 10343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1035676e1743SMark F. Adams } 1036676e1743SMark F. Adams 1037d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetProcEqLim_GAMG(PC pc, PetscInt n) 1038d71ae5a4SJacob Faibussowitsch { 1039c20e4228SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 1040c20e4228SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1041676e1743SMark F. Adams 1042676e1743SMark F. Adams PetscFunctionBegin; 10439d5b6da9SMark F. Adams if (n > 0) pc_gamg->min_eq_proc = n; 10443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1045676e1743SMark F. Adams } 1046676e1743SMark F. Adams 1047389730f3SMark F. Adams /*@ 1048f1580f4eSBarry Smith PCGAMGSetCoarseEqLim - Set maximum number of equations on the coarsest grid of `PCGAMG` 1049389730f3SMark F. Adams 1050c3339decSBarry Smith Collective 1051389730f3SMark F. Adams 1052389730f3SMark F. Adams Input Parameters: 10531cc46a46SBarry Smith + pc - the preconditioner context 10541cc46a46SBarry Smith - n - maximum number of equations to aim for 1055389730f3SMark F. Adams 1056389730f3SMark F. Adams Options Database Key: 1057147403d9SBarry Smith . -pc_gamg_coarse_eq_limit <limit> - set the limit 1058389730f3SMark F. Adams 105920f4b53cSBarry Smith Level: intermediate 106020f4b53cSBarry Smith 1061f1580f4eSBarry Smith Note: 1062f1580f4eSBarry Smith For example -pc_gamg_coarse_eq_limit 1000 will stop coarsening once the coarse grid 106374329af1SBarry Smith has less than 1000 unknowns. 106474329af1SBarry Smith 1065a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetProcEqLim()`, `PCGAMGSetRankReductionFactors()`, `PCGAMGSetRepartition()`, 1066a077d33dSBarry Smith `PCGAMGSetParallelCoarseGridSolve()` 1067389730f3SMark F. Adams @*/ 1068d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetCoarseEqLim(PC pc, PetscInt n) 1069d71ae5a4SJacob Faibussowitsch { 1070389730f3SMark F. Adams PetscFunctionBegin; 1071389730f3SMark F. Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1072cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetCoarseEqLim_C", (PC, PetscInt), (pc, n)); 10733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1074389730f3SMark F. Adams } 1075389730f3SMark F. Adams 1076d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetCoarseEqLim_GAMG(PC pc, PetscInt n) 1077d71ae5a4SJacob Faibussowitsch { 1078389730f3SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 1079389730f3SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1080389730f3SMark F. Adams 1081389730f3SMark F. Adams PetscFunctionBegin; 10829d5b6da9SMark F. Adams if (n > 0) pc_gamg->coarse_eq_limit = n; 10833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1084389730f3SMark F. Adams } 1085389730f3SMark F. Adams 1086676e1743SMark F. Adams /*@ 1087f1580f4eSBarry Smith PCGAMGSetRepartition - Repartition the degrees of freedom across the processors on the coarser grids when reducing the number of MPI ranks to use 1088676e1743SMark F. Adams 1089c3339decSBarry Smith Collective 1090676e1743SMark F. Adams 1091676e1743SMark F. Adams Input Parameters: 10921cc46a46SBarry Smith + pc - the preconditioner context 1093f1580f4eSBarry Smith - n - `PETSC_TRUE` or `PETSC_FALSE` 1094676e1743SMark F. Adams 1095676e1743SMark F. Adams Options Database Key: 1096147403d9SBarry Smith . -pc_gamg_repartition <true,false> - turn on the repartitioning 1097676e1743SMark F. Adams 109820f4b53cSBarry Smith Level: intermediate 109920f4b53cSBarry Smith 1100f1580f4eSBarry Smith Note: 1101a077d33dSBarry Smith This will generally improve the loading balancing of the work on each level so the solves will be faster but it adds to the 1102a077d33dSBarry Smith preconditioner setup time. 1103cab9ed1eSBarry Smith 1104a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetProcEqLim()`, `PCGAMGSetRankReductionFactors()` 1105676e1743SMark F. Adams @*/ 1106d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetRepartition(PC pc, PetscBool n) 1107d71ae5a4SJacob Faibussowitsch { 1108676e1743SMark F. Adams PetscFunctionBegin; 1109676e1743SMark F. Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1110cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetRepartition_C", (PC, PetscBool), (pc, n)); 11113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1112676e1743SMark F. Adams } 1113676e1743SMark F. Adams 1114d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetRepartition_GAMG(PC pc, PetscBool n) 1115d71ae5a4SJacob Faibussowitsch { 1116c20e4228SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 1117c20e4228SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1118676e1743SMark F. Adams 1119676e1743SMark F. Adams PetscFunctionBegin; 11209d5b6da9SMark F. Adams pc_gamg->repart = n; 11213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1122676e1743SMark F. Adams } 1123676e1743SMark F. Adams 1124dfd5c07aSMark F. Adams /*@ 1125f1580f4eSBarry Smith PCGAMGSetUseSAEstEig - Use the eigen estimate from smoothed aggregation for the Chebyshev smoother during the solution process 112618c3aa7eSMark 1127c3339decSBarry Smith Collective 112818c3aa7eSMark 112918c3aa7eSMark Input Parameters: 113018c3aa7eSMark + pc - the preconditioner context 1131e1cf1444SMark Adams - b - flag 113218c3aa7eSMark 113318c3aa7eSMark Options Database Key: 1134147403d9SBarry Smith . -pc_gamg_use_sa_esteig <true,false> - use the eigen estimate 113518c3aa7eSMark 113620f4b53cSBarry Smith Level: advanced 113720f4b53cSBarry Smith 113818c3aa7eSMark Notes: 11397e6512fdSJed Brown Smoothed aggregation constructs the smoothed prolongator $P = (I - \omega D^{-1} A) T$ where $T$ is the tentative prolongator and $D$ is the diagonal of $A$. 1140f1580f4eSBarry Smith Eigenvalue estimates (based on a few `PCCG` or `PCGMRES` iterations) are computed to choose $\omega$ so that this is a stable smoothing operation. 1141a077d33dSBarry Smith If `KSPCHEBYSHEV` with `PCJACOBI` (diagonal) preconditioning is used for smoothing on the finest level, then the eigenvalue estimates 1142a077d33dSBarry Smith can be reused during the solution process. 1143a077d33dSBarry Smith This option is only used when the smoother uses `PCJACOBI`, and should be turned off when a different `PCJacobiType` is used. 1144efe053fcSJed Brown It became default in PETSc 3.17. 114518c3aa7eSMark 1146a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `KSPChebyshevSetEigenvalues()`, `KSPChebyshevEstEigSet()`, `PCGAMGSetRecomputeEstEig()` 114718c3aa7eSMark @*/ 1148e1cf1444SMark Adams PetscErrorCode PCGAMGSetUseSAEstEig(PC pc, PetscBool b) 1149d71ae5a4SJacob Faibussowitsch { 115018c3aa7eSMark PetscFunctionBegin; 115118c3aa7eSMark PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1152e1cf1444SMark Adams PetscTryMethod(pc, "PCGAMGSetUseSAEstEig_C", (PC, PetscBool), (pc, b)); 11533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115418c3aa7eSMark } 115518c3aa7eSMark 1156e1cf1444SMark Adams static PetscErrorCode PCGAMGSetUseSAEstEig_GAMG(PC pc, PetscBool b) 1157d71ae5a4SJacob Faibussowitsch { 115818c3aa7eSMark PC_MG *mg = (PC_MG *)pc->data; 115918c3aa7eSMark PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 116018c3aa7eSMark 116118c3aa7eSMark PetscFunctionBegin; 1162e1cf1444SMark Adams pc_gamg->use_sa_esteig = b; 1163e1cf1444SMark Adams PetscFunctionReturn(PETSC_SUCCESS); 1164e1cf1444SMark Adams } 1165e1cf1444SMark Adams 1166e1cf1444SMark Adams /*@ 1167a077d33dSBarry Smith PCGAMGSetRecomputeEstEig - Set flag for Chebyshev smoothers to recompute the eigen estimates when a new matrix is used 1168e1cf1444SMark Adams 1169e1cf1444SMark Adams Collective 1170e1cf1444SMark Adams 1171e1cf1444SMark Adams Input Parameters: 1172e1cf1444SMark Adams + pc - the preconditioner context 1173a077d33dSBarry Smith - b - flag, default is `PETSC_TRUE` 1174e1cf1444SMark Adams 1175e1cf1444SMark Adams Options Database Key: 1176e1cf1444SMark Adams . -pc_gamg_recompute_esteig <true> - use the eigen estimate 1177e1cf1444SMark Adams 1178e1cf1444SMark Adams Level: advanced 1179e1cf1444SMark Adams 1180a077d33dSBarry Smith Note: 1181a077d33dSBarry Smith If the matrix changes only slightly in a new solve using ``PETSC_FALSE`` will save time in the setting up of the preconditioner 1182a077d33dSBarry Smith and may not affect the solution time much. 1183a077d33dSBarry Smith 1184a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `KSPChebyshevSetEigenvalues()`, `KSPChebyshevEstEigSet()` 1185e1cf1444SMark Adams @*/ 1186e1cf1444SMark Adams PetscErrorCode PCGAMGSetRecomputeEstEig(PC pc, PetscBool b) 1187e1cf1444SMark Adams { 1188e1cf1444SMark Adams PetscFunctionBegin; 1189e1cf1444SMark Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1190e1cf1444SMark Adams PetscTryMethod(pc, "PCGAMGSetRecomputeEstEig_C", (PC, PetscBool), (pc, b)); 1191e1cf1444SMark Adams PetscFunctionReturn(PETSC_SUCCESS); 1192e1cf1444SMark Adams } 1193e1cf1444SMark Adams 1194e1cf1444SMark Adams static PetscErrorCode PCGAMGSetRecomputeEstEig_GAMG(PC pc, PetscBool b) 1195e1cf1444SMark Adams { 1196e1cf1444SMark Adams PC_MG *mg = (PC_MG *)pc->data; 1197e1cf1444SMark Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1198e1cf1444SMark Adams 1199e1cf1444SMark Adams PetscFunctionBegin; 1200e1cf1444SMark Adams pc_gamg->recompute_esteig = b; 12013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120218c3aa7eSMark } 120318c3aa7eSMark 120418c3aa7eSMark /*@ 1205f1580f4eSBarry Smith PCGAMGSetEigenvalues - Set WHAT eigenvalues WHY? 120618c3aa7eSMark 1207c3339decSBarry Smith Collective 120818c3aa7eSMark 120918c3aa7eSMark Input Parameters: 121018c3aa7eSMark + pc - the preconditioner context 1211feefa0e1SJacob Faibussowitsch . emax - max eigenvalue 1212feefa0e1SJacob Faibussowitsch - emin - min eigenvalue 121318c3aa7eSMark 121418c3aa7eSMark Options Database Key: 1215147403d9SBarry Smith . -pc_gamg_eigenvalues <emin,emax> - estimates of the eigenvalues 121618c3aa7eSMark 121718c3aa7eSMark Level: intermediate 121818c3aa7eSMark 1219a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetUseSAEstEig()` 122018c3aa7eSMark @*/ 1221d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetEigenvalues(PC pc, PetscReal emax, PetscReal emin) 1222d71ae5a4SJacob Faibussowitsch { 122318c3aa7eSMark PetscFunctionBegin; 122418c3aa7eSMark PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1225cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetEigenvalues_C", (PC, PetscReal, PetscReal), (pc, emax, emin)); 12263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 122718c3aa7eSMark } 122841ffd417SStefano Zampini 1229d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetEigenvalues_GAMG(PC pc, PetscReal emax, PetscReal emin) 1230d71ae5a4SJacob Faibussowitsch { 123118c3aa7eSMark PC_MG *mg = (PC_MG *)pc->data; 123218c3aa7eSMark PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 123318c3aa7eSMark 123418c3aa7eSMark PetscFunctionBegin; 12355f80ce2aSJacob Faibussowitsch PetscCheck(emax > emin, PetscObjectComm((PetscObject)pc), PETSC_ERR_ARG_INCOMP, "Maximum eigenvalue must be larger than minimum: max %g min %g", (double)emax, (double)emin); 12365f80ce2aSJacob Faibussowitsch PetscCheck(emax * emin > 0.0, PetscObjectComm((PetscObject)pc), PETSC_ERR_ARG_INCOMP, "Both eigenvalues must be of the same sign: max %g min %g", (double)emax, (double)emin); 123718c3aa7eSMark pc_gamg->emax = emax; 123818c3aa7eSMark pc_gamg->emin = emin; 12393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 124018c3aa7eSMark } 124118c3aa7eSMark 124218c3aa7eSMark /*@ 1243f1580f4eSBarry Smith PCGAMGSetReuseInterpolation - Reuse prolongation when rebuilding a `PCGAMG` algebraic multigrid preconditioner 1244dfd5c07aSMark F. Adams 1245c3339decSBarry Smith Collective 1246dfd5c07aSMark F. Adams 1247dfd5c07aSMark F. Adams Input Parameters: 12481cc46a46SBarry Smith + pc - the preconditioner context 1249f1580f4eSBarry Smith - n - `PETSC_TRUE` or `PETSC_FALSE` 1250dfd5c07aSMark F. Adams 1251dfd5c07aSMark F. Adams Options Database Key: 1252147403d9SBarry Smith . -pc_gamg_reuse_interpolation <true,false> - reuse the previous interpolation 1253dfd5c07aSMark F. Adams 1254dfd5c07aSMark F. Adams Level: intermediate 1255dfd5c07aSMark F. Adams 1256f1580f4eSBarry Smith Note: 1257147403d9SBarry Smith May negatively affect the convergence rate of the method on new matrices if the matrix entries change a great deal, but allows 1258cab9ed1eSBarry Smith rebuilding the preconditioner quicker. 1259cab9ed1eSBarry Smith 1260a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG` 1261dfd5c07aSMark F. Adams @*/ 1262d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetReuseInterpolation(PC pc, PetscBool n) 1263d71ae5a4SJacob Faibussowitsch { 1264dfd5c07aSMark F. Adams PetscFunctionBegin; 1265dfd5c07aSMark F. Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1266cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetReuseInterpolation_C", (PC, PetscBool), (pc, n)); 12673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1268dfd5c07aSMark F. Adams } 1269dfd5c07aSMark F. Adams 1270d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetReuseInterpolation_GAMG(PC pc, PetscBool n) 1271d71ae5a4SJacob Faibussowitsch { 1272dfd5c07aSMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 1273dfd5c07aSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1274dfd5c07aSMark F. Adams 1275dfd5c07aSMark F. Adams PetscFunctionBegin; 1276dfd5c07aSMark F. Adams pc_gamg->reuse_prol = n; 12773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1278dfd5c07aSMark F. Adams } 1279dfd5c07aSMark F. Adams 1280ffc955d6SMark F. Adams /*@ 1281a077d33dSBarry Smith PCGAMGASMSetUseAggs - Have the `PCGAMG` smoother on each level use `PCASM` where the aggregates defined by the coarsening process are 1282a077d33dSBarry Smith the subdomains for the additive Schwarz preconditioner used as the smoother 1283ffc955d6SMark F. Adams 1284c3339decSBarry Smith Collective 1285ffc955d6SMark F. Adams 1286ffc955d6SMark F. Adams Input Parameters: 1287cab9ed1eSBarry Smith + pc - the preconditioner context 1288f1580f4eSBarry Smith - flg - `PETSC_TRUE` to use aggregates, `PETSC_FALSE` to not 1289ffc955d6SMark F. Adams 1290ffc955d6SMark F. Adams Options Database Key: 1291147403d9SBarry Smith . -pc_gamg_asm_use_agg <true,false> - use aggregates to define the additive Schwarz subdomains 1292ffc955d6SMark F. Adams 1293ffc955d6SMark F. Adams Level: intermediate 1294ffc955d6SMark F. Adams 1295a077d33dSBarry Smith Note: 1296a077d33dSBarry Smith This option automatically sets the preconditioner on the levels to be `PCASM`. 1297a077d33dSBarry Smith 1298a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCASM`, `PCSetType` 1299ffc955d6SMark F. Adams @*/ 1300d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGASMSetUseAggs(PC pc, PetscBool flg) 1301d71ae5a4SJacob Faibussowitsch { 1302ffc955d6SMark F. Adams PetscFunctionBegin; 1303ffc955d6SMark F. Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1304cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGASMSetUseAggs_C", (PC, PetscBool), (pc, flg)); 13053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1306ffc955d6SMark F. Adams } 1307ffc955d6SMark F. Adams 1308d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGASMSetUseAggs_GAMG(PC pc, PetscBool flg) 1309d71ae5a4SJacob Faibussowitsch { 1310ffc955d6SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 1311ffc955d6SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1312ffc955d6SMark F. Adams 1313ffc955d6SMark F. Adams PetscFunctionBegin; 1314cab9ed1eSBarry Smith pc_gamg->use_aggs_in_asm = flg; 13153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1316ffc955d6SMark F. Adams } 1317ffc955d6SMark F. Adams 1318171cca9aSMark Adams /*@ 1319d529f056Smarkadams4 PCGAMGSetParallelCoarseGridSolve - allow a parallel coarse grid solver 1320171cca9aSMark Adams 1321c3339decSBarry Smith Collective 1322171cca9aSMark Adams 1323171cca9aSMark Adams Input Parameters: 1324171cca9aSMark Adams + pc - the preconditioner context 1325f1580f4eSBarry Smith - flg - `PETSC_TRUE` to not force coarse grid onto one processor 1326171cca9aSMark Adams 1327171cca9aSMark Adams Options Database Key: 1328a077d33dSBarry Smith . -pc_gamg_parallel_coarse_grid_solver - use a parallel coarse grid solver 1329171cca9aSMark Adams 1330171cca9aSMark Adams Level: intermediate 1331171cca9aSMark Adams 1332a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetCoarseGridLayoutType()`, `PCGAMGSetCpuPinCoarseGrids()`, `PCGAMGSetRankReductionFactors()` 1333171cca9aSMark Adams @*/ 1334d529f056Smarkadams4 PetscErrorCode PCGAMGSetParallelCoarseGridSolve(PC pc, PetscBool flg) 1335d71ae5a4SJacob Faibussowitsch { 1336171cca9aSMark Adams PetscFunctionBegin; 1337171cca9aSMark Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1338d529f056Smarkadams4 PetscTryMethod(pc, "PCGAMGSetParallelCoarseGridSolve_C", (PC, PetscBool), (pc, flg)); 13393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1340171cca9aSMark Adams } 1341171cca9aSMark Adams 1342d529f056Smarkadams4 static PetscErrorCode PCGAMGSetParallelCoarseGridSolve_GAMG(PC pc, PetscBool flg) 1343d71ae5a4SJacob Faibussowitsch { 1344171cca9aSMark Adams PC_MG *mg = (PC_MG *)pc->data; 1345171cca9aSMark Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1346171cca9aSMark Adams 1347171cca9aSMark Adams PetscFunctionBegin; 1348171cca9aSMark Adams pc_gamg->use_parallel_coarse_grid_solver = flg; 13493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1350ffc955d6SMark F. Adams } 1351ffc955d6SMark F. Adams 13524ef23d27SMark F. Adams /*@ 1353f1580f4eSBarry Smith PCGAMGSetCpuPinCoarseGrids - pin the coarse grids created in `PCGAMG` to run only on the CPU since the problems may be too small to run efficiently on the GPUs 1354ce7c7f2fSMark Adams 1355c3339decSBarry Smith Collective 1356ce7c7f2fSMark Adams 1357ce7c7f2fSMark Adams Input Parameters: 1358ce7c7f2fSMark Adams + pc - the preconditioner context 1359f1580f4eSBarry Smith - flg - `PETSC_TRUE` to pin coarse grids to the CPU 1360ce7c7f2fSMark Adams 1361ce7c7f2fSMark Adams Options Database Key: 1362147403d9SBarry Smith . -pc_gamg_cpu_pin_coarse_grids - pin the coarse grids to the CPU 1363ce7c7f2fSMark Adams 1364ce7c7f2fSMark Adams Level: intermediate 1365ce7c7f2fSMark Adams 1366a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetCoarseGridLayoutType()`, `PCGAMGSetParallelCoarseGridSolve()` 1367ce7c7f2fSMark Adams @*/ 1368d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetCpuPinCoarseGrids(PC pc, PetscBool flg) 1369d71ae5a4SJacob Faibussowitsch { 1370ce7c7f2fSMark Adams PetscFunctionBegin; 1371ce7c7f2fSMark Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1372cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetCpuPinCoarseGrids_C", (PC, PetscBool), (pc, flg)); 13733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1374ce7c7f2fSMark Adams } 1375ce7c7f2fSMark Adams 1376d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetCpuPinCoarseGrids_GAMG(PC pc, PetscBool flg) 1377d71ae5a4SJacob Faibussowitsch { 1378ce7c7f2fSMark Adams PC_MG *mg = (PC_MG *)pc->data; 1379ce7c7f2fSMark Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1380ce7c7f2fSMark Adams 1381ce7c7f2fSMark Adams PetscFunctionBegin; 1382ce7c7f2fSMark Adams pc_gamg->cpu_pin_coarse_grids = flg; 13833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1384ce7c7f2fSMark Adams } 1385ce7c7f2fSMark Adams 1386ce7c7f2fSMark Adams /*@ 1387147403d9SBarry Smith PCGAMGSetCoarseGridLayoutType - place coarse grids on processors with natural order (compact type) 1388ce7c7f2fSMark Adams 1389c3339decSBarry Smith Collective 1390ce7c7f2fSMark Adams 1391ce7c7f2fSMark Adams Input Parameters: 1392ce7c7f2fSMark Adams + pc - the preconditioner context 1393f1580f4eSBarry Smith - flg - `PCGAMGLayoutType` type, either `PCGAMG_LAYOUT_COMPACT` or `PCGAMG_LAYOUT_SPREAD` 1394ce7c7f2fSMark Adams 1395ce7c7f2fSMark Adams Options Database Key: 1396147403d9SBarry Smith . -pc_gamg_coarse_grid_layout_type - place the coarse grids with natural ordering 1397ce7c7f2fSMark Adams 1398ce7c7f2fSMark Adams Level: intermediate 1399ce7c7f2fSMark Adams 1400a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetParallelCoarseGridSolve()`, `PCGAMGSetCpuPinCoarseGrids()`, `PCGAMGLayoutType`, `PCGAMG_LAYOUT_COMPACT`, `PCGAMG_LAYOUT_SPREAD` 1401ce7c7f2fSMark Adams @*/ 1402d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetCoarseGridLayoutType(PC pc, PCGAMGLayoutType flg) 1403d71ae5a4SJacob Faibussowitsch { 1404ce7c7f2fSMark Adams PetscFunctionBegin; 1405ce7c7f2fSMark Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1406cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetCoarseGridLayoutType_C", (PC, PCGAMGLayoutType), (pc, flg)); 14073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1408ce7c7f2fSMark Adams } 1409ce7c7f2fSMark Adams 1410d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetCoarseGridLayoutType_GAMG(PC pc, PCGAMGLayoutType flg) 1411d71ae5a4SJacob Faibussowitsch { 1412ce7c7f2fSMark Adams PC_MG *mg = (PC_MG *)pc->data; 1413ce7c7f2fSMark Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1414ce7c7f2fSMark Adams 1415ce7c7f2fSMark Adams PetscFunctionBegin; 1416ce7c7f2fSMark Adams pc_gamg->layout_type = flg; 14173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1418ce7c7f2fSMark Adams } 1419ce7c7f2fSMark Adams 1420ce7c7f2fSMark Adams /*@ 1421f1580f4eSBarry Smith PCGAMGSetNlevels - Sets the maximum number of levels `PCGAMG` will use 14224ef23d27SMark F. Adams 14238926f930SMark Adams Collective 14244ef23d27SMark F. Adams 14254ef23d27SMark F. Adams Input Parameters: 14261cc46a46SBarry Smith + pc - the preconditioner 14271cc46a46SBarry Smith - n - the maximum number of levels to use 14284ef23d27SMark F. Adams 14294ef23d27SMark F. Adams Options Database Key: 1430147403d9SBarry Smith . -pc_mg_levels <n> - set the maximum number of levels to allow 14314ef23d27SMark F. Adams 14324ef23d27SMark F. Adams Level: intermediate 14334ef23d27SMark F. Adams 1434feefa0e1SJacob Faibussowitsch Developer Notes: 1435f1580f4eSBarry Smith Should be called `PCGAMGSetMaximumNumberlevels()` and possible be shared with `PCMG` 1436f1580f4eSBarry Smith 1437a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG` 14384ef23d27SMark F. Adams @*/ 1439d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetNlevels(PC pc, PetscInt n) 1440d71ae5a4SJacob Faibussowitsch { 14414ef23d27SMark F. Adams PetscFunctionBegin; 14424ef23d27SMark F. Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1443cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetNlevels_C", (PC, PetscInt), (pc, n)); 14443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14454ef23d27SMark F. Adams } 14464ef23d27SMark F. Adams 1447d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetNlevels_GAMG(PC pc, PetscInt n) 1448d71ae5a4SJacob Faibussowitsch { 14494ef23d27SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 14504ef23d27SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 14514ef23d27SMark F. Adams 14524ef23d27SMark F. Adams PetscFunctionBegin; 14539d5b6da9SMark F. Adams pc_gamg->Nlevels = n; 14543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14554ef23d27SMark F. Adams } 14564ef23d27SMark F. Adams 14573542efc5SMark F. Adams /*@ 14588926f930SMark Adams PCGAMGASMSetHEM - Sets the number of HEM matching passed 14598926f930SMark Adams 14608926f930SMark Adams Collective 14618926f930SMark Adams 14628926f930SMark Adams Input Parameters: 14638926f930SMark Adams + pc - the preconditioner 14648926f930SMark Adams - n - number of HEM matching passed to construct ASM subdomains 14658926f930SMark Adams 14668926f930SMark Adams Options Database Key: 14678926f930SMark Adams . -pc_gamg_asm_hem <n> - set the number of HEM matching passed 14688926f930SMark Adams 14698926f930SMark Adams Level: intermediate 14708926f930SMark Adams 14718926f930SMark Adams Developer Notes: 14728926f930SMark Adams Should be called `PCGAMGSetMaximumNumberlevels()` and possible be shared with `PCMG` 14738926f930SMark Adams 1474a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG` 14758926f930SMark Adams @*/ 14768926f930SMark Adams PetscErrorCode PCGAMGASMSetHEM(PC pc, PetscInt n) 14778926f930SMark Adams { 14788926f930SMark Adams PetscFunctionBegin; 14798926f930SMark Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 14808926f930SMark Adams PetscTryMethod(pc, "PCGAMGASMSetHEM_C", (PC, PetscInt), (pc, n)); 14818926f930SMark Adams PetscFunctionReturn(PETSC_SUCCESS); 14828926f930SMark Adams } 14838926f930SMark Adams 14848926f930SMark Adams static PetscErrorCode PCGAMGASMSetHEM_GAMG(PC pc, PetscInt n) 14858926f930SMark Adams { 14868926f930SMark Adams PC_MG *mg = (PC_MG *)pc->data; 14878926f930SMark Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 14888926f930SMark Adams 14898926f930SMark Adams PetscFunctionBegin; 14908926f930SMark Adams pc_gamg->asm_hem_aggs = n; 14918926f930SMark Adams PetscFunctionReturn(PETSC_SUCCESS); 14928926f930SMark Adams } 14938926f930SMark Adams 14948926f930SMark Adams /*@ 14953542efc5SMark F. Adams PCGAMGSetThreshold - Relative threshold to use for dropping edges in aggregation graph 14963542efc5SMark F. Adams 149720f4b53cSBarry Smith Not Collective 14983542efc5SMark F. Adams 14993542efc5SMark F. Adams Input Parameters: 15001cc46a46SBarry Smith + pc - the preconditioner context 1501c9567895SMark . v - array of threshold values for finest n levels; 0.0 means keep all nonzero entries in the graph; negative means keep even zero entries in the graph 1502055c8bd0SJed Brown - n - number of threshold values provided in array 15033542efc5SMark F. Adams 15043542efc5SMark F. Adams Options Database Key: 1505147403d9SBarry Smith . -pc_gamg_threshold <threshold> - the threshold to drop edges 15063542efc5SMark F. Adams 150720f4b53cSBarry Smith Level: intermediate 150820f4b53cSBarry Smith 150995452b02SPatrick Sanan Notes: 1510af3c827dSMark Adams Increasing the threshold decreases the rate of coarsening. Conversely reducing the threshold increases the rate of coarsening (aggressive coarsening) and thereby reduces the complexity of the coarse grids, and generally results in slower solver converge rates. Reducing coarse grid complexity reduced the complexity of Galerkin coarse grid construction considerably. 1511f1580f4eSBarry Smith Before coarsening or aggregating the graph, `PCGAMG` removes small values from the graph with this threshold, and thus reducing the coupling in the graph and a different (perhaps better) coarser set of points. 1512cab9ed1eSBarry Smith 151320f4b53cSBarry Smith If `n` is less than the total number of coarsenings (see `PCGAMGSetNlevels()`), then threshold scaling (see `PCGAMGSetThresholdScale()`) is used for each successive coarsening. 1514f1580f4eSBarry Smith In this case, `PCGAMGSetThresholdScale()` must be called before `PCGAMGSetThreshold()`. 151520f4b53cSBarry Smith If `n` is greater than the total number of levels, the excess entries in threshold will not be used. 15163542efc5SMark F. Adams 1517a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetAggressiveLevels()`, `PCGAMGMISkSetAggressive()`, `PCGAMGSetMinDegreeOrderingMISk()`, `PCGAMGSetThresholdScale()` 15183542efc5SMark F. Adams @*/ 1519d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetThreshold(PC pc, PetscReal v[], PetscInt n) 1520d71ae5a4SJacob Faibussowitsch { 15213542efc5SMark F. Adams PetscFunctionBegin; 15223542efc5SMark F. Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 15234f572ea9SToby Isaac if (n) PetscAssertPointer(v, 2); 1524cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetThreshold_C", (PC, PetscReal[], PetscInt), (pc, v, n)); 15253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 15263542efc5SMark F. Adams } 15273542efc5SMark F. Adams 1528d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetThreshold_GAMG(PC pc, PetscReal v[], PetscInt n) 1529d71ae5a4SJacob Faibussowitsch { 1530c20e4228SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 1531c20e4228SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1532c1eae691SMark Adams PetscInt i; 15334d86920dSPierre Jolivet 1534c1eae691SMark Adams PetscFunctionBegin; 1535055c8bd0SJed Brown for (i = 0; i < PetscMin(n, PETSC_MG_MAXLEVELS); i++) pc_gamg->threshold[i] = v[i]; 1536055c8bd0SJed Brown for (; i < PETSC_MG_MAXLEVELS; i++) pc_gamg->threshold[i] = pc_gamg->threshold[i - 1] * pc_gamg->threshold_scale; 15373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1538c1eae691SMark Adams } 1539c1eae691SMark Adams 1540c1eae691SMark Adams /*@ 1541f1580f4eSBarry Smith PCGAMGSetRankReductionFactors - Set a manual schedule for MPI rank reduction on coarse grids 1542c9567895SMark 1543c3339decSBarry Smith Collective 1544c9567895SMark 1545c9567895SMark Input Parameters: 1546c9567895SMark + pc - the preconditioner context 1547f1580f4eSBarry Smith . v - array of reduction factors. 0 for first value forces a reduction to one process/device on first level in CUDA 1548c9567895SMark - n - number of values provided in array 1549c9567895SMark 1550c9567895SMark Options Database Key: 1551147403d9SBarry Smith . -pc_gamg_rank_reduction_factors <factors> - provide the schedule 1552c9567895SMark 1553c9567895SMark Level: intermediate 1554c9567895SMark 1555a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetProcEqLim()`, `PCGAMGSetCoarseEqLim()`, `PCGAMGSetParallelCoarseGridSolve()` 1556c9567895SMark @*/ 1557d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetRankReductionFactors(PC pc, PetscInt v[], PetscInt n) 1558d71ae5a4SJacob Faibussowitsch { 1559c9567895SMark PetscFunctionBegin; 1560c9567895SMark PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 15614f572ea9SToby Isaac if (n) PetscAssertPointer(v, 2); 1562cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetRankReductionFactors_C", (PC, PetscInt[], PetscInt), (pc, v, n)); 15633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1564c9567895SMark } 1565c9567895SMark 1566d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetRankReductionFactors_GAMG(PC pc, PetscInt v[], PetscInt n) 1567d71ae5a4SJacob Faibussowitsch { 1568c9567895SMark PC_MG *mg = (PC_MG *)pc->data; 1569c9567895SMark PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1570c9567895SMark PetscInt i; 15714d86920dSPierre Jolivet 1572c9567895SMark PetscFunctionBegin; 1573c9567895SMark for (i = 0; i < PetscMin(n, PETSC_MG_MAXLEVELS); i++) pc_gamg->level_reduction_factors[i] = v[i]; 1574c9567895SMark for (; i < PETSC_MG_MAXLEVELS; i++) pc_gamg->level_reduction_factors[i] = -1; /* 0 stop putting one process/device on first level */ 15753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1576c9567895SMark } 1577c9567895SMark 1578c9567895SMark /*@ 1579c1eae691SMark Adams PCGAMGSetThresholdScale - Relative threshold reduction at each level 1580c1eae691SMark Adams 158120f4b53cSBarry Smith Not Collective 1582c1eae691SMark Adams 1583c1eae691SMark Adams Input Parameters: 1584c1eae691SMark Adams + pc - the preconditioner context 1585feefa0e1SJacob Faibussowitsch - v - the threshold value reduction, usually < 1.0 1586c1eae691SMark Adams 1587c1eae691SMark Adams Options Database Key: 1588147403d9SBarry Smith . -pc_gamg_threshold_scale <v> - set the relative threshold reduction on each level 1589c1eae691SMark Adams 159020f4b53cSBarry Smith Level: advanced 159120f4b53cSBarry Smith 1592f1580f4eSBarry Smith Note: 1593f1580f4eSBarry Smith The initial threshold (for an arbitrary number of levels starting from the finest) can be set with `PCGAMGSetThreshold()`. 1594f1580f4eSBarry Smith This scaling is used for each subsequent coarsening, but must be called before `PCGAMGSetThreshold()`. 1595055c8bd0SJed Brown 1596a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetThreshold()` 1597c1eae691SMark Adams @*/ 1598d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetThresholdScale(PC pc, PetscReal v) 1599d71ae5a4SJacob Faibussowitsch { 16003542efc5SMark F. Adams PetscFunctionBegin; 1601c1eae691SMark Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1602cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetThresholdScale_C", (PC, PetscReal), (pc, v)); 16033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1604c1eae691SMark Adams } 1605c1eae691SMark Adams 1606d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetThresholdScale_GAMG(PC pc, PetscReal v) 1607d71ae5a4SJacob Faibussowitsch { 1608c1eae691SMark Adams PC_MG *mg = (PC_MG *)pc->data; 1609c1eae691SMark Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 16104d86920dSPierre Jolivet 1611c1eae691SMark Adams PetscFunctionBegin; 1612c1eae691SMark Adams pc_gamg->threshold_scale = v; 16133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16143542efc5SMark F. Adams } 16153542efc5SMark F. Adams 1616cc4c1da9SBarry Smith /*@ 1617f1580f4eSBarry Smith PCGAMGSetType - Set the type of algorithm `PCGAMG` should use 1618676e1743SMark F. Adams 1619c3339decSBarry Smith Collective 1620676e1743SMark F. Adams 1621676e1743SMark F. Adams Input Parameters: 1622c60c7ad4SBarry Smith + pc - the preconditioner context 1623f1580f4eSBarry Smith - type - `PCGAMGAGG`, `PCGAMGGEO`, or `PCGAMGCLASSICAL` 1624676e1743SMark F. Adams 1625676e1743SMark F. Adams Options Database Key: 1626a077d33dSBarry Smith . -pc_gamg_type <agg,geo,classical> - type of algebraic multigrid to apply - only agg is supported 1627676e1743SMark F. Adams 1628676e1743SMark F. Adams Level: intermediate 1629676e1743SMark F. Adams 1630a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMGGetType()`, `PCGAMG`, `PCGAMGType` 1631676e1743SMark F. Adams @*/ 1632d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGSetType(PC pc, PCGAMGType type) 1633d71ae5a4SJacob Faibussowitsch { 1634676e1743SMark F. Adams PetscFunctionBegin; 1635676e1743SMark F. Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1636cac4c232SBarry Smith PetscTryMethod(pc, "PCGAMGSetType_C", (PC, PCGAMGType), (pc, type)); 16373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1638676e1743SMark F. Adams } 1639676e1743SMark F. Adams 1640cc4c1da9SBarry Smith /*@ 1641f1580f4eSBarry Smith PCGAMGGetType - Get the type of algorithm `PCGAMG` will use 1642c60c7ad4SBarry Smith 1643c3339decSBarry Smith Collective 1644c60c7ad4SBarry Smith 1645c60c7ad4SBarry Smith Input Parameter: 1646c60c7ad4SBarry Smith . pc - the preconditioner context 1647c60c7ad4SBarry Smith 1648c60c7ad4SBarry Smith Output Parameter: 1649c60c7ad4SBarry Smith . type - the type of algorithm used 1650c60c7ad4SBarry Smith 1651c60c7ad4SBarry Smith Level: intermediate 1652c60c7ad4SBarry Smith 1653a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCGAMG`, `PCGAMGSetType()`, `PCGAMGType` 1654c60c7ad4SBarry Smith @*/ 1655d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGGetType(PC pc, PCGAMGType *type) 1656d71ae5a4SJacob Faibussowitsch { 1657c60c7ad4SBarry Smith PetscFunctionBegin; 1658c60c7ad4SBarry Smith PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1659cac4c232SBarry Smith PetscUseMethod(pc, "PCGAMGGetType_C", (PC, PCGAMGType *), (pc, type)); 16603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1661c60c7ad4SBarry Smith } 1662c60c7ad4SBarry Smith 1663d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGGetType_GAMG(PC pc, PCGAMGType *type) 1664d71ae5a4SJacob Faibussowitsch { 1665c60c7ad4SBarry Smith PC_MG *mg = (PC_MG *)pc->data; 1666c60c7ad4SBarry Smith PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 1667c60c7ad4SBarry Smith 1668c60c7ad4SBarry Smith PetscFunctionBegin; 1669c60c7ad4SBarry Smith *type = pc_gamg->type; 16703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1671c60c7ad4SBarry Smith } 1672c60c7ad4SBarry Smith 1673d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCGAMGSetType_GAMG(PC pc, PCGAMGType type) 1674d71ae5a4SJacob Faibussowitsch { 16751ab5ffc9SJed Brown PC_MG *mg = (PC_MG *)pc->data; 16761ab5ffc9SJed Brown PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 16775f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(PC); 1678676e1743SMark F. Adams 1679676e1743SMark F. Adams PetscFunctionBegin; 1680c60c7ad4SBarry Smith pc_gamg->type = type; 16819566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(GAMGList, type, &r)); 16826adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)pc), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown GAMG type %s given", type); 16831ab5ffc9SJed Brown if (pc_gamg->ops->destroy) { 16849566063dSJacob Faibussowitsch PetscCall((*pc_gamg->ops->destroy)(pc)); 16859566063dSJacob Faibussowitsch PetscCall(PetscMemzero(pc_gamg->ops, sizeof(struct _PCGAMGOps))); 1686e616c208SToby Isaac pc_gamg->ops->createlevel = PCGAMGCreateLevel_GAMG; 1687da81f932SPierre Jolivet /* cleaning up common data in pc_gamg - this should disappear someday */ 16883ae0bb68SMark Adams pc_gamg->data_cell_cols = 0; 16893ae0bb68SMark Adams pc_gamg->data_cell_rows = 0; 16903ae0bb68SMark Adams pc_gamg->orig_data_cell_cols = 0; 16913ae0bb68SMark Adams pc_gamg->orig_data_cell_rows = 0; 16929566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg->data)); 16933ae0bb68SMark Adams pc_gamg->data_sz = 0; 16941ab5ffc9SJed Brown } 16959566063dSJacob Faibussowitsch PetscCall(PetscFree(pc_gamg->gamg_type_name)); 16969566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(type, &pc_gamg->gamg_type_name)); 16979566063dSJacob Faibussowitsch PetscCall((*r)(pc)); 16983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1699676e1743SMark F. Adams } 1700676e1743SMark F. Adams 1701d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCView_GAMG(PC pc, PetscViewer viewer) 1702d71ae5a4SJacob Faibussowitsch { 17035adeb434SBarry Smith PC_MG *mg = (PC_MG *)pc->data; 17046c34c54dSStefano Zampini PC_MG_Levels **mglevels = mg->levels; 17055adeb434SBarry Smith PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 17066c34c54dSStefano Zampini PetscReal gc, oc; 170790db8557SMark Adams 17085adeb434SBarry Smith PetscFunctionBegin; 17099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " GAMG specific options\n")); 17109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " Threshold for dropping small values in graph on each level =")); 17119566063dSJacob Faibussowitsch for (PetscInt i = 0; i < mg->nlevels; i++) PetscCall(PetscViewerASCIIPrintf(viewer, " %g", (double)pc_gamg->threshold[i])); 17129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 17139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " Threshold scaling factor for each level not specified = %g\n", (double)pc_gamg->threshold_scale)); 1714e0b7e82fSBarry Smith if (pc_gamg->use_aggs_in_asm) PetscCall(PetscViewerASCIIPrintf(viewer, " Using aggregates from GAMG coarsening process to define subdomains for PCASM\n")); // this take presedence 1715e0b7e82fSBarry Smith else if (pc_gamg->asm_hem_aggs) { 1716e0b7e82fSBarry Smith PetscCall(PetscViewerASCIIPrintf(viewer, " Using aggregates made with %d applications of heavy edge matching (HEM) to define subdomains for PCASM\n", (int)pc_gamg->asm_hem_aggs)); 1717e0b7e82fSBarry Smith PetscCall(PetscViewerASCIIPushTab(viewer)); 1718e0b7e82fSBarry Smith PetscCall(PetscViewerASCIIPushTab(viewer)); 1719e0b7e82fSBarry Smith PetscCall(PetscViewerASCIIPushTab(viewer)); 1720e0b7e82fSBarry Smith PetscCall(PetscViewerASCIIPushTab(viewer)); 1721e0b7e82fSBarry Smith PetscCall(MatCoarsenView(pc_gamg->asm_crs, viewer)); 1722e0b7e82fSBarry Smith PetscCall(PetscViewerASCIIPopTab(viewer)); 1723e0b7e82fSBarry Smith PetscCall(PetscViewerASCIIPopTab(viewer)); 1724e0b7e82fSBarry Smith PetscCall(PetscViewerASCIIPopTab(viewer)); 1725e0b7e82fSBarry Smith } 172648a46eb9SPierre Jolivet if (pc_gamg->use_parallel_coarse_grid_solver) PetscCall(PetscViewerASCIIPrintf(viewer, " Using parallel coarse grid solver (all coarse grid equations not put on one process)\n")); 1727b65aec2dSMark Adams if (pc_gamg->injection_index_size) { 1728b65aec2dSMark Adams PetscCall(PetscViewerASCIIPrintf(viewer, " Using injection restriction/prolongation on first level, dofs:")); 1729b65aec2dSMark Adams for (int i = 0; i < pc_gamg->injection_index_size; i++) PetscCall(PetscViewerASCIIPrintf(viewer, " %d", (int)pc_gamg->injection_index[i])); 1730b65aec2dSMark Adams PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 1731b65aec2dSMark Adams } 17321baa6e33SBarry Smith if (pc_gamg->ops->view) PetscCall((*pc_gamg->ops->view)(pc, viewer)); 17336c34c54dSStefano Zampini gc = oc = 0; 17349566063dSJacob Faibussowitsch PetscCall(PCMGGetGridComplexity(pc, &gc, &oc)); 173563a3b9bcSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " Complexity: grid = %g operator = %g\n", (double)gc, (double)oc)); 17366c34c54dSStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " Per-level complexity: op = operator, int = interpolation\n")); 17376c34c54dSStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " #equations | #active PEs | avg nnz/row op | avg nnz/row int\n")); 17386c34c54dSStefano Zampini for (PetscInt i = 0; i < mg->nlevels; i++) { 17396c34c54dSStefano Zampini MatInfo info; 17406c34c54dSStefano Zampini Mat A; 17416c34c54dSStefano Zampini PetscReal rd[3]; 17426c34c54dSStefano Zampini PetscInt rst, ren, N; 17436c34c54dSStefano Zampini 17446c34c54dSStefano Zampini PetscCall(KSPGetOperators(mglevels[i]->smoothd, NULL, &A)); 17456c34c54dSStefano Zampini PetscCall(MatGetOwnershipRange(A, &rst, &ren)); 17466c34c54dSStefano Zampini PetscCall(MatGetSize(A, &N, NULL)); 17476c34c54dSStefano Zampini PetscCall(MatGetInfo(A, MAT_LOCAL, &info)); 17486c34c54dSStefano Zampini rd[0] = (ren - rst > 0) ? 1 : 0; 17496c34c54dSStefano Zampini rd[1] = info.nz_used; 17506c34c54dSStefano Zampini rd[2] = 0; 17516c34c54dSStefano Zampini if (i) { 17526c34c54dSStefano Zampini Mat P; 17536c34c54dSStefano Zampini PetscCall(PCMGGetInterpolation(pc, i, &P)); 17546c34c54dSStefano Zampini PetscCall(MatGetInfo(P, MAT_LOCAL, &info)); 17556c34c54dSStefano Zampini rd[2] = info.nz_used; 17566c34c54dSStefano Zampini } 17576c34c54dSStefano Zampini PetscCall(MPIU_Allreduce(MPI_IN_PLACE, rd, 3, MPIU_REAL, MPIU_SUM, PetscObjectComm((PetscObject)pc))); 17586c34c54dSStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " %12" PetscInt_FMT " %12" PetscInt_FMT " %12" PetscInt_FMT " %12" PetscInt_FMT "\n", N, (PetscInt)rd[0], (PetscInt)PetscCeilReal(rd[1] / N), (PetscInt)PetscCeilReal(rd[2] / N))); 17596c34c54dSStefano Zampini } 17603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17615adeb434SBarry Smith } 17625adeb434SBarry Smith 1763b65aec2dSMark Adams /*@ 1764b65aec2dSMark Adams PCGAMGSetInjectionIndex - Array of subset of variables per vertex to inject into coarse grid space 1765b65aec2dSMark Adams 1766b65aec2dSMark Adams Logically Collective 1767b65aec2dSMark Adams 1768b65aec2dSMark Adams Input Parameters: 1769b65aec2dSMark Adams + pc - the coarsen context 1770b65aec2dSMark Adams . n - number of indices 1771b65aec2dSMark Adams - idx - array of indices 1772b65aec2dSMark Adams 1773b65aec2dSMark Adams Options Database Key: 1774b65aec2dSMark Adams . -pc_gamg_injection_index - array of subset of variables per vertex to use for injection coarse grid space 1775b65aec2dSMark Adams 1776b65aec2dSMark Adams Level: intermediate 1777b65aec2dSMark Adams 1778a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), `PCGAMG` 1779b65aec2dSMark Adams @*/ 1780b65aec2dSMark Adams PetscErrorCode PCGAMGSetInjectionIndex(PC pc, PetscInt n, PetscInt idx[]) 1781b65aec2dSMark Adams { 1782b65aec2dSMark Adams PetscFunctionBegin; 1783b65aec2dSMark Adams PetscValidHeaderSpecific(pc, PC_CLASSID, 1); 1784b65aec2dSMark Adams PetscValidLogicalCollectiveInt(pc, n, 2); 1785b65aec2dSMark Adams PetscTryMethod(pc, "PCGAMGSetInjectionIndex_C", (PC, PetscInt, PetscInt[]), (pc, n, idx)); 1786b65aec2dSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 1787b65aec2dSMark Adams } 1788b65aec2dSMark Adams 1789b65aec2dSMark Adams static PetscErrorCode PCGAMGSetInjectionIndex_GAMG(PC pc, PetscInt n, PetscInt idx[]) 1790b65aec2dSMark Adams { 1791b65aec2dSMark Adams PC_MG *mg = (PC_MG *)pc->data; 1792b65aec2dSMark Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 17934d86920dSPierre Jolivet 1794b65aec2dSMark Adams PetscFunctionBegin; 1795b65aec2dSMark Adams pc_gamg->injection_index_size = n; 1796b65aec2dSMark Adams PetscCheck(n < MAT_COARSEN_STRENGTH_INDEX_SIZE, PetscObjectComm((PetscObject)pc), PETSC_ERR_ARG_INCOMP, "array size %d larger than max %d", (int)n, MAT_COARSEN_STRENGTH_INDEX_SIZE); 17974d86920dSPierre Jolivet for (PetscInt i = 0; i < n; i++) pc_gamg->injection_index[i] = idx[i]; 1798b65aec2dSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 1799b65aec2dSMark Adams } 1800b65aec2dSMark Adams 180166976f2fSJacob Faibussowitsch static PetscErrorCode PCSetFromOptions_GAMG(PC pc, PetscOptionItems *PetscOptionsObject) 1802d71ae5a4SJacob Faibussowitsch { 1803676e1743SMark F. Adams PC_MG *mg = (PC_MG *)pc->data; 1804676e1743SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 18057e6512fdSJed Brown PetscBool flag; 18063b4367a7SBarry Smith MPI_Comm comm; 180718c3aa7eSMark char prefix[256], tname[32]; 1808c1eae691SMark Adams PetscInt i, n; 180914a9496bSBarry Smith const char *pcpre; 18100a545947SLisandro Dalcin static const char *LayoutTypes[] = {"compact", "spread", "PCGAMGLayoutType", "PC_GAMG_LAYOUT", NULL}; 18118926f930SMark Adams 18125b89ad90SMark F. Adams PetscFunctionBegin; 18139566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm)); 1814d0609cedSBarry Smith PetscOptionsHeadBegin(PetscOptionsObject, "GAMG options"); 18155fb461b6SMatthew Knepley PetscCall(PetscOptionsInt("-pc_mg_levels", "Number of Levels", "PCMGSetLevels", -1, &n, &flag)); 18165fb461b6SMatthew Knepley PetscCheck(!flag, comm, PETSC_ERR_ARG_WRONG, "Invalid flag -pc_mg_levels. GAMG does not allow the number of levels to be set."); 18175e4ac8c8Smarkadams4 PetscCall(PetscOptionsFList("-pc_gamg_type", "Type of AMG method (only 'agg' supported and useful)", "PCGAMGSetType", GAMGList, pc_gamg->gamg_type_name, tname, sizeof(tname), &flag)); 18181baa6e33SBarry Smith if (flag) PetscCall(PCGAMGSetType(pc, tname)); 18199566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-pc_gamg_repartition", "Repartion coarse grids", "PCGAMGSetRepartition", pc_gamg->repart, &pc_gamg->repart, NULL)); 1820f1580f4eSBarry Smith PetscCall(PetscOptionsBool("-pc_gamg_use_sa_esteig", "Use eigen estimate from smoothed aggregation for smoother", "PCGAMGSetUseSAEstEig", pc_gamg->use_sa_esteig, &pc_gamg->use_sa_esteig, NULL)); 1821e1cf1444SMark Adams PetscCall(PetscOptionsBool("-pc_gamg_recompute_esteig", "Set flag to recompute eigen estimates for Chebyshev when matrix changes", "PCGAMGSetRecomputeEstEig", pc_gamg->recompute_esteig, &pc_gamg->recompute_esteig, NULL)); 18229566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-pc_gamg_reuse_interpolation", "Reuse prolongation operator", "PCGAMGReuseInterpolation", pc_gamg->reuse_prol, &pc_gamg->reuse_prol, NULL)); 18239566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-pc_gamg_asm_use_agg", "Use aggregation aggregates for ASM smoother", "PCGAMGASMSetUseAggs", pc_gamg->use_aggs_in_asm, &pc_gamg->use_aggs_in_asm, NULL)); 1824d529f056Smarkadams4 PetscCall(PetscOptionsBool("-pc_gamg_parallel_coarse_grid_solver", "Use parallel coarse grid solver (otherwise put last grid on one process)", "PCGAMGSetParallelCoarseGridSolve", pc_gamg->use_parallel_coarse_grid_solver, &pc_gamg->use_parallel_coarse_grid_solver, NULL)); 18259566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-pc_gamg_cpu_pin_coarse_grids", "Pin coarse grids to the CPU", "PCGAMGSetCpuPinCoarseGrids", pc_gamg->cpu_pin_coarse_grids, &pc_gamg->cpu_pin_coarse_grids, NULL)); 18269371c9d4SSatish Balay PetscCall(PetscOptionsEnum("-pc_gamg_coarse_grid_layout_type", "compact: place reduced grids on processes in natural order; spread: distribute to whole machine for more memory bandwidth", "PCGAMGSetCoarseGridLayoutType", LayoutTypes, 18279371c9d4SSatish Balay (PetscEnum)pc_gamg->layout_type, (PetscEnum *)&pc_gamg->layout_type, NULL)); 18289566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-pc_gamg_process_eq_limit", "Limit (goal) on number of equations per process on coarse grids", "PCGAMGSetProcEqLim", pc_gamg->min_eq_proc, &pc_gamg->min_eq_proc, NULL)); 18299566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-pc_gamg_coarse_eq_limit", "Limit on number of equations for the coarse grid", "PCGAMGSetCoarseEqLim", pc_gamg->coarse_eq_limit, &pc_gamg->coarse_eq_limit, NULL)); 18308926f930SMark Adams PetscCall(PetscOptionsInt("-pc_gamg_asm_hem_aggs", "Number of HEM matching passed in aggregates for ASM smoother", "PCGAMGASMSetHEM", pc_gamg->asm_hem_aggs, &pc_gamg->asm_hem_aggs, NULL)); 18319566063dSJacob Faibussowitsch PetscCall(PetscOptionsReal("-pc_gamg_threshold_scale", "Scaling of threshold for each level not specified", "PCGAMGSetThresholdScale", pc_gamg->threshold_scale, &pc_gamg->threshold_scale, NULL)); 183218c3aa7eSMark n = PETSC_MG_MAXLEVELS; 18339566063dSJacob Faibussowitsch PetscCall(PetscOptionsRealArray("-pc_gamg_threshold", "Relative threshold to use for dropping edges in aggregation graph", "PCGAMGSetThreshold", pc_gamg->threshold, &n, &flag)); 183418c3aa7eSMark if (!flag || n < PETSC_MG_MAXLEVELS) { 1835efd3c5ceSMark Adams if (!flag) n = 1; 1836c1eae691SMark Adams i = n; 1837d71ae5a4SJacob Faibussowitsch do { 1838d71ae5a4SJacob Faibussowitsch pc_gamg->threshold[i] = pc_gamg->threshold[i - 1] * pc_gamg->threshold_scale; 1839d71ae5a4SJacob Faibussowitsch } while (++i < PETSC_MG_MAXLEVELS); 1840c1eae691SMark Adams } 18419c15c1aeSMark Adams PetscCall(PetscOptionsInt("-pc_mg_levels", "Set number of MG levels (should get from base class)", "PCGAMGSetNlevels", pc_gamg->Nlevels, &pc_gamg->Nlevels, NULL)); 18429c15c1aeSMark Adams PetscCheck(pc_gamg->Nlevels <= PETSC_MG_MAXLEVELS, PetscObjectComm((PetscObject)pc), PETSC_ERR_ARG_INCOMP, "-pc_mg_levels (%d) >= PETSC_MG_MAXLEVELS (%d)", (int)pc_gamg->Nlevels, (int)PETSC_MG_MAXLEVELS); 1843c9567895SMark n = PETSC_MG_MAXLEVELS; 18449566063dSJacob Faibussowitsch PetscCall(PetscOptionsIntArray("-pc_gamg_rank_reduction_factors", "Manual schedule of coarse grid reduction factors that overrides internal heuristics (0 for first reduction puts one process/device)", "PCGAMGSetRankReductionFactors", pc_gamg->level_reduction_factors, &n, &flag)); 1845c9567895SMark if (!flag) i = 0; 1846c9567895SMark else i = n; 1847d71ae5a4SJacob Faibussowitsch do { 1848d71ae5a4SJacob Faibussowitsch pc_gamg->level_reduction_factors[i] = -1; 1849d71ae5a4SJacob Faibussowitsch } while (++i < PETSC_MG_MAXLEVELS); 185018c3aa7eSMark { 185118c3aa7eSMark PetscReal eminmax[2] = {0., 0.}; 185218c3aa7eSMark n = 2; 18539566063dSJacob Faibussowitsch PetscCall(PetscOptionsRealArray("-pc_gamg_eigenvalues", "extreme eigenvalues for smoothed aggregation", "PCGAMGSetEigenvalues", eminmax, &n, &flag)); 185418c3aa7eSMark if (flag) { 185508401ef6SPierre Jolivet PetscCheck(n == 2, PetscObjectComm((PetscObject)pc), PETSC_ERR_ARG_INCOMP, "-pc_gamg_eigenvalues: must specify 2 parameters, min and max eigenvalues"); 18569566063dSJacob Faibussowitsch PetscCall(PCGAMGSetEigenvalues(pc, eminmax[1], eminmax[0])); 185718c3aa7eSMark } 185818c3aa7eSMark } 1859b65aec2dSMark Adams pc_gamg->injection_index_size = MAT_COARSEN_STRENGTH_INDEX_SIZE; 1860b65aec2dSMark Adams PetscCall(PetscOptionsIntArray("-pc_gamg_injection_index", "Array of indices to use to use injection coarse grid space", "PCGAMGSetInjectionIndex", pc_gamg->injection_index, &pc_gamg->injection_index_size, NULL)); 1861b7cbab4eSMark Adams /* set options for subtype */ 1862dbbe0bcdSBarry Smith PetscCall((*pc_gamg->ops->setfromoptions)(pc, PetscOptionsObject)); 186318c3aa7eSMark 18649566063dSJacob Faibussowitsch PetscCall(PCGetOptionsPrefix(pc, &pcpre)); 18659566063dSJacob Faibussowitsch PetscCall(PetscSNPrintf(prefix, sizeof(prefix), "%spc_gamg_", pcpre ? pcpre : "")); 1866d0609cedSBarry Smith PetscOptionsHeadEnd(); 18673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18685b89ad90SMark F. Adams } 18695b89ad90SMark F. Adams 18705b89ad90SMark F. Adams /*MC 18711cc46a46SBarry Smith PCGAMG - Geometric algebraic multigrid (AMG) preconditioner 18725b89ad90SMark F. Adams 1873280d9858SJed Brown Options Database Keys: 18745e4ac8c8Smarkadams4 + -pc_gamg_type <type,default=agg> - one of agg, geo, or classical (only smoothed aggregation, agg, supported) 1875da81f932SPierre Jolivet . -pc_gamg_repartition <bool,default=false> - repartition the degrees of freedom across the coarse grids as they are determined 187621d928e4Smarkadams4 . -pc_gamg_asm_use_agg <bool,default=false> - use the aggregates from the coasening process to defined the subdomains on each level for the PCASM smoother 1877da81f932SPierre Jolivet . -pc_gamg_process_eq_limit <limit, default=50> - `PCGAMG` will reduce the number of MPI ranks used directly on the coarse grids so that there are around <limit> 1878cab9ed1eSBarry Smith equations on each process that has degrees of freedom 18792d776b49SBarry Smith . -pc_gamg_coarse_eq_limit <limit, default=50> - Set maximum number of equations on coarsest grid to aim for. 188021d928e4Smarkadams4 . -pc_gamg_reuse_interpolation <bool,default=true> - when rebuilding the algebraic multigrid preconditioner reuse the previously computed interpolations (should always be true) 188121d928e4Smarkadams4 . -pc_gamg_threshold[] <thresh,default=[-1,...]> - Before aggregating the graph `PCGAMG` will remove small values from the graph on each level (< 0 does no filtering) 18822d776b49SBarry Smith - -pc_gamg_threshold_scale <scale,default=1> - Scaling of threshold on each coarser grid if not specified 1883cab9ed1eSBarry Smith 1884f1580f4eSBarry Smith Options Database Keys for Aggregation: 1885a077d33dSBarry Smith + -pc_gamg_agg_nsmooths <nsmooth, default=1> - number of smoothing steps to use with smooth aggregation to construct prolongation 1886d529f056Smarkadams4 . -pc_gamg_aggressive_coarsening <n,default=1> - number of aggressive coarsening (MIS-2) levels from finest. 1887d529f056Smarkadams4 . -pc_gamg_aggressive_square_graph <bool,default=false> - Use square graph (A'A) or MIS-k (k=2) for aggressive coarsening 1888d529f056Smarkadams4 . -pc_gamg_mis_k_minimum_degree_ordering <bool,default=true> - Use minimum degree ordering in greedy MIS algorithm 18898926f930SMark Adams . -pc_gamg_pc_gamg_asm_hem_aggs <n,default=0> - Number of HEM aggregation steps for ASM smoother 1890d529f056Smarkadams4 - -pc_gamg_aggressive_mis_k <n,default=2> - Number (k) distance in MIS coarsening (>2 is 'aggressive') 1891cab9ed1eSBarry Smith 1892f1580f4eSBarry Smith Options Database Keys for Multigrid: 1893a9f5add0SYANG Zongze + -pc_mg_cycle_type <v> - v or w, see `PCMGSetCycleType()` 1894db9745e2SBarry Smith . -pc_mg_distinct_smoothup - configure the up and down (pre and post) smoothers separately, see PCMGSetDistinctSmoothUp() 1895db9745e2SBarry Smith . -pc_mg_type <multiplicative> - (one of) additive multiplicative full kascade 189621d928e4Smarkadams4 - -pc_mg_levels <levels> - Number of levels of multigrid to use. GAMG has a heuristic so pc_mg_levels is not usually used with GAMG 18975b89ad90SMark F. Adams 189820f4b53cSBarry Smith Level: intermediate 189920f4b53cSBarry Smith 190095452b02SPatrick Sanan Notes: 1901f1580f4eSBarry Smith To obtain good performance for `PCGAMG` for vector valued problems you must 1902f1580f4eSBarry Smith call `MatSetBlockSize()` to indicate the number of degrees of freedom per grid point 1903f1580f4eSBarry Smith call `MatSetNearNullSpace()` (or `PCSetCoordinates()` if solving the equations of elasticity) to indicate the near null space of the operator 1904f1580f4eSBarry Smith 190504c3f3b8SBarry Smith The many options for `PCMG` also work directly for `PCGAMG` such as controlling the smoothers on each level etc. 190604c3f3b8SBarry Smith 1907a077d33dSBarry Smith .seealso: [the Users Manual section on PCGAMG](sec_amg), [the Users Manual section on PCMG](sec_mg), [](ch_ksp), `PCCreate()`, `PCSetType()`, 1908a077d33dSBarry Smith `MatSetBlockSize()`, 1909a077d33dSBarry Smith `PCMGType`, `PCSetCoordinates()`, `MatSetNearNullSpace()`, `PCGAMGSetType()`, `PCGAMGAGG`, `PCGAMGGEO`, `PCGAMGCLASSICAL`, `PCGAMGSetProcEqLim()`, 1910a077d33dSBarry Smith `PCGAMGSetCoarseEqLim()`, `PCGAMGSetRepartition()`, `PCGAMGRegister()`, `PCGAMGSetReuseInterpolation()`, `PCGAMGASMSetUseAggs()`, 1911a077d33dSBarry Smith `PCGAMGSetParallelCoarseGridSolve()`, `PCGAMGSetNlevels()`, `PCGAMGSetThreshold()`, `PCGAMGGetType()`, `PCGAMGSetUseSAEstEig()` 19125b89ad90SMark F. Adams M*/ 1913d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode PCCreate_GAMG(PC pc) 1914d71ae5a4SJacob Faibussowitsch { 19155b89ad90SMark F. Adams PC_GAMG *pc_gamg; 19165b89ad90SMark F. Adams PC_MG *mg; 19175b89ad90SMark F. Adams 19185b89ad90SMark F. Adams PetscFunctionBegin; 19191c1aac46SBarry Smith /* register AMG type */ 19209566063dSJacob Faibussowitsch PetscCall(PCGAMGInitializePackage()); 19211c1aac46SBarry Smith 19225b89ad90SMark F. Adams /* PCGAMG is an inherited class of PCMG. Initialize pc as PCMG */ 19239566063dSJacob Faibussowitsch PetscCall(PCSetType(pc, PCMG)); 19249566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)pc, PCGAMG)); 19255b89ad90SMark F. Adams 19265b89ad90SMark F. Adams /* create a supporting struct and attach it to pc */ 19274dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&pc_gamg)); 19289566063dSJacob Faibussowitsch PetscCall(PCMGSetGalerkin(pc, PC_MG_GALERKIN_EXTERNAL)); 19295b89ad90SMark F. Adams mg = (PC_MG *)pc->data; 19305b89ad90SMark F. Adams mg->innerctx = pc_gamg; 19315b89ad90SMark F. Adams 19324dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&pc_gamg->ops)); 19331ab5ffc9SJed Brown 19349d5b6da9SMark F. Adams /* these should be in subctx but repartitioning needs simple arrays */ 19359d5b6da9SMark F. Adams pc_gamg->data_sz = 0; 19360a545947SLisandro Dalcin pc_gamg->data = NULL; 19375b89ad90SMark F. Adams 19389d5b6da9SMark F. Adams /* overwrite the pointers of PCMG by the functions of base class PCGAMG */ 19395b89ad90SMark F. Adams pc->ops->setfromoptions = PCSetFromOptions_GAMG; 19405b89ad90SMark F. Adams pc->ops->setup = PCSetUp_GAMG; 19415b89ad90SMark F. Adams pc->ops->reset = PCReset_GAMG; 19425b89ad90SMark F. Adams pc->ops->destroy = PCDestroy_GAMG; 19435adeb434SBarry Smith mg->view = PCView_GAMG; 19445b89ad90SMark F. Adams 19459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetProcEqLim_C", PCGAMGSetProcEqLim_GAMG)); 19469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetCoarseEqLim_C", PCGAMGSetCoarseEqLim_GAMG)); 19479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetRepartition_C", PCGAMGSetRepartition_GAMG)); 19489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetEigenvalues_C", PCGAMGSetEigenvalues_GAMG)); 19499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetUseSAEstEig_C", PCGAMGSetUseSAEstEig_GAMG)); 1950e1cf1444SMark Adams PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetRecomputeEstEig_C", PCGAMGSetRecomputeEstEig_GAMG)); 19519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetReuseInterpolation_C", PCGAMGSetReuseInterpolation_GAMG)); 19529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGASMSetUseAggs_C", PCGAMGASMSetUseAggs_GAMG)); 1953d529f056Smarkadams4 PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetParallelCoarseGridSolve_C", PCGAMGSetParallelCoarseGridSolve_GAMG)); 19549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetCpuPinCoarseGrids_C", PCGAMGSetCpuPinCoarseGrids_GAMG)); 19559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetCoarseGridLayoutType_C", PCGAMGSetCoarseGridLayoutType_GAMG)); 19569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetThreshold_C", PCGAMGSetThreshold_GAMG)); 19579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetRankReductionFactors_C", PCGAMGSetRankReductionFactors_GAMG)); 19589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetThresholdScale_C", PCGAMGSetThresholdScale_GAMG)); 19599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetType_C", PCGAMGSetType_GAMG)); 19609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGGetType_C", PCGAMGGetType_GAMG)); 19619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetNlevels_C", PCGAMGSetNlevels_GAMG)); 19628926f930SMark Adams PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGASMSetHEM_C", PCGAMGASMSetHEM_GAMG)); 1963b65aec2dSMark Adams PetscCall(PetscObjectComposeFunction((PetscObject)pc, "PCGAMGSetInjectionIndex_C", PCGAMGSetInjectionIndex_GAMG)); 19649d5b6da9SMark F. Adams pc_gamg->repart = PETSC_FALSE; 196521d928e4Smarkadams4 pc_gamg->reuse_prol = PETSC_TRUE; 19660c3bc534SBarry Smith pc_gamg->use_aggs_in_asm = PETSC_FALSE; 1967171cca9aSMark Adams pc_gamg->use_parallel_coarse_grid_solver = PETSC_FALSE; 1968a0095786SMark pc_gamg->cpu_pin_coarse_grids = PETSC_FALSE; 1969a0095786SMark pc_gamg->layout_type = PCGAMG_LAYOUT_SPREAD; 1970038f3aa4SMark F. Adams pc_gamg->min_eq_proc = 50; 19718926f930SMark Adams pc_gamg->asm_hem_aggs = 0; 197225a145a7SMark Adams pc_gamg->coarse_eq_limit = 50; 197353134ebeSMark Adams for (int i = 0; i < PETSC_MG_MAXLEVELS; i++) pc_gamg->threshold[i] = -1; 1974c1eae691SMark Adams pc_gamg->threshold_scale = 1.; 197518c3aa7eSMark pc_gamg->Nlevels = PETSC_MG_MAXLEVELS; 19769ab59c8bSMark Adams pc_gamg->current_level = 0; /* don't need to init really */ 19777e6512fdSJed Brown pc_gamg->use_sa_esteig = PETSC_TRUE; 1978e1cf1444SMark Adams pc_gamg->recompute_esteig = PETSC_TRUE; 197918c3aa7eSMark pc_gamg->emin = 0; 198018c3aa7eSMark pc_gamg->emax = 0; 198118c3aa7eSMark 1982c238b0ebSToby Isaac pc_gamg->ops->createlevel = PCGAMGCreateLevel_GAMG; 19839d5b6da9SMark F. Adams 1984bd94a7aaSJed Brown /* PCSetUp_GAMG assumes that the type has been set, so set it to the default now */ 19859566063dSJacob Faibussowitsch PetscCall(PCGAMGSetType(pc, PCGAMGAGG)); 19863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19875b89ad90SMark F. Adams } 19883e3471ccSMark Adams 19893e3471ccSMark Adams /*@C 1990f1580f4eSBarry Smith PCGAMGInitializePackage - This function initializes everything in the `PCGAMG` package. It is called 1991f1580f4eSBarry Smith from `PCInitializePackage()`. 19923e3471ccSMark Adams 19933e3471ccSMark Adams Level: developer 19943e3471ccSMark Adams 1995562efe2eSBarry Smith .seealso: [](ch_ksp), `PetscInitialize()` 19963e3471ccSMark Adams @*/ 1997d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGInitializePackage(void) 1998d71ae5a4SJacob Faibussowitsch { 19994555aa8cSStefano Zampini PetscInt l; 20003e3471ccSMark Adams 20013e3471ccSMark Adams PetscFunctionBegin; 20023ba16761SJacob Faibussowitsch if (PCGAMGPackageInitialized) PetscFunctionReturn(PETSC_SUCCESS); 20033e3471ccSMark Adams PCGAMGPackageInitialized = PETSC_TRUE; 20049566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&GAMGList, PCGAMGGEO, PCCreateGAMG_GEO)); 20059566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&GAMGList, PCGAMGAGG, PCCreateGAMG_AGG)); 20069566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&GAMGList, PCGAMGCLASSICAL, PCCreateGAMG_Classical)); 20079566063dSJacob Faibussowitsch PetscCall(PetscRegisterFinalize(PCGAMGFinalizePackage)); 2008c1c463dbSMark Adams 2009c1c463dbSMark Adams /* general events */ 2010849bee69SMark Adams PetscCall(PetscLogEventRegister("PCSetUp_GAMG+", PC_CLASSID, &petsc_gamg_setup_events[GAMG_SETUP])); 2011849bee69SMark Adams PetscCall(PetscLogEventRegister(" PCGAMGCreateG", PC_CLASSID, &petsc_gamg_setup_events[GAMG_GRAPH])); 2012849bee69SMark Adams PetscCall(PetscLogEventRegister(" GAMG Coarsen", PC_CLASSID, &petsc_gamg_setup_events[GAMG_COARSEN])); 2013849bee69SMark Adams PetscCall(PetscLogEventRegister(" GAMG MIS/Agg", PC_CLASSID, &petsc_gamg_setup_events[GAMG_MIS])); 2014849bee69SMark Adams PetscCall(PetscLogEventRegister(" PCGAMGProl", PC_CLASSID, &petsc_gamg_setup_events[GAMG_PROL])); 2015849bee69SMark Adams PetscCall(PetscLogEventRegister(" GAMG Prol-col", PC_CLASSID, &petsc_gamg_setup_events[GAMG_PROLA])); 2016849bee69SMark Adams PetscCall(PetscLogEventRegister(" GAMG Prol-lift", PC_CLASSID, &petsc_gamg_setup_events[GAMG_PROLB])); 2017849bee69SMark Adams PetscCall(PetscLogEventRegister(" PCGAMGOptProl", PC_CLASSID, &petsc_gamg_setup_events[GAMG_OPT])); 2018849bee69SMark Adams PetscCall(PetscLogEventRegister(" GAMG smooth", PC_CLASSID, &petsc_gamg_setup_events[GAMG_OPTSM])); 2019849bee69SMark Adams PetscCall(PetscLogEventRegister(" PCGAMGCreateL", PC_CLASSID, &petsc_gamg_setup_events[GAMG_LEVEL])); 2020849bee69SMark Adams PetscCall(PetscLogEventRegister(" GAMG PtAP", PC_CLASSID, &petsc_gamg_setup_events[GAMG_PTAP])); 2021849bee69SMark Adams PetscCall(PetscLogEventRegister(" GAMG Reduce", PC_CLASSID, &petsc_gamg_setup_events[GAMG_REDUCE])); 2022849bee69SMark Adams PetscCall(PetscLogEventRegister(" GAMG Repart", PC_CLASSID, &petsc_gamg_setup_events[GAMG_REPART])); 2023849bee69SMark Adams /* PetscCall(PetscLogEventRegister(" GAMG Inv-Srt", PC_CLASSID, &petsc_gamg_setup_events[SET13])); */ 2024849bee69SMark Adams /* PetscCall(PetscLogEventRegister(" GAMG Move A", PC_CLASSID, &petsc_gamg_setup_events[SET14])); */ 2025849bee69SMark Adams /* PetscCall(PetscLogEventRegister(" GAMG Move P", PC_CLASSID, &petsc_gamg_setup_events[SET15])); */ 20264555aa8cSStefano Zampini for (l = 0; l < PETSC_MG_MAXLEVELS; l++) { 20274555aa8cSStefano Zampini char ename[32]; 20285b89ad90SMark F. Adams 202963a3b9bcSJacob Faibussowitsch PetscCall(PetscSNPrintf(ename, sizeof(ename), "PCGAMG Squ l%02" PetscInt_FMT, l)); 20309566063dSJacob Faibussowitsch PetscCall(PetscLogEventRegister(ename, PC_CLASSID, &petsc_gamg_setup_matmat_events[l][0])); 203163a3b9bcSJacob Faibussowitsch PetscCall(PetscSNPrintf(ename, sizeof(ename), "PCGAMG Gal l%02" PetscInt_FMT, l)); 20329566063dSJacob Faibussowitsch PetscCall(PetscLogEventRegister(ename, PC_CLASSID, &petsc_gamg_setup_matmat_events[l][1])); 203363a3b9bcSJacob Faibussowitsch PetscCall(PetscSNPrintf(ename, sizeof(ename), "PCGAMG Opt l%02" PetscInt_FMT, l)); 20349566063dSJacob Faibussowitsch PetscCall(PetscLogEventRegister(ename, PC_CLASSID, &petsc_gamg_setup_matmat_events[l][2])); 20354555aa8cSStefano Zampini } 20364555aa8cSStefano Zampini #if defined(GAMG_STAGES) 2037849bee69SMark Adams { /* create timer stages */ 20385b89ad90SMark F. Adams char str[32]; 2039a364092eSJacob Faibussowitsch PetscCall(PetscSNPrintf(str, PETSC_STATIC_ARRAY_LENGTH(str), "GAMG Level %d", 0)); 20409566063dSJacob Faibussowitsch PetscCall(PetscLogStageRegister(str, &gamg_stages[0])); 20415b89ad90SMark F. Adams } 20425b89ad90SMark F. Adams #endif 20433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20443e3471ccSMark Adams } 20453e3471ccSMark Adams 20463e3471ccSMark Adams /*@C 2047f1580f4eSBarry Smith PCGAMGFinalizePackage - This function frees everything from the `PCGAMG` package. It is 2048f1580f4eSBarry Smith called from `PetscFinalize()` automatically. 20493e3471ccSMark Adams 20503e3471ccSMark Adams Level: developer 20513e3471ccSMark Adams 2052562efe2eSBarry Smith .seealso: [](ch_ksp), `PetscFinalize()` 20533e3471ccSMark Adams @*/ 2054d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGFinalizePackage(void) 2055d71ae5a4SJacob Faibussowitsch { 20563e3471ccSMark Adams PetscFunctionBegin; 20573e3471ccSMark Adams PCGAMGPackageInitialized = PETSC_FALSE; 20589566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDestroy(&GAMGList)); 20593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20603e3471ccSMark Adams } 2061a36cf38bSToby Isaac 2062a36cf38bSToby Isaac /*@C 2063f1580f4eSBarry Smith PCGAMGRegister - Register a `PCGAMG` implementation. 2064a36cf38bSToby Isaac 2065a36cf38bSToby Isaac Input Parameters: 2066f1580f4eSBarry Smith + type - string that will be used as the name of the `PCGAMG` type. 2067a36cf38bSToby Isaac - create - function for creating the gamg context. 2068a36cf38bSToby Isaac 2069f1580f4eSBarry Smith Level: developer 2070a36cf38bSToby Isaac 2071562efe2eSBarry Smith .seealso: [](ch_ksp), `PCGAMGType`, `PCGAMG`, `PCGAMGSetType()` 2072a36cf38bSToby Isaac @*/ 2073d71ae5a4SJacob Faibussowitsch PetscErrorCode PCGAMGRegister(PCGAMGType type, PetscErrorCode (*create)(PC)) 2074d71ae5a4SJacob Faibussowitsch { 2075a36cf38bSToby Isaac PetscFunctionBegin; 20769566063dSJacob Faibussowitsch PetscCall(PCGAMGInitializePackage()); 20779566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&GAMGList, type, create)); 20783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2079a36cf38bSToby Isaac } 20802d776b49SBarry Smith 2081cc4c1da9SBarry Smith /*@ 20822d776b49SBarry Smith PCGAMGCreateGraph - Creates a graph that is used by the ``PCGAMGType`` in the coarsening process 20832d776b49SBarry Smith 20842d776b49SBarry Smith Input Parameters: 20852d776b49SBarry Smith + pc - the `PCGAMG` 20862d776b49SBarry Smith - A - the matrix, for any level 20872d776b49SBarry Smith 20882d776b49SBarry Smith Output Parameter: 20892d776b49SBarry Smith . G - the graph 20902d776b49SBarry Smith 20912d776b49SBarry Smith Level: advanced 20922d776b49SBarry Smith 2093562efe2eSBarry Smith .seealso: [](ch_ksp), `PCGAMGType`, `PCGAMG`, `PCGAMGSetType()` 20942d776b49SBarry Smith @*/ 20952d776b49SBarry Smith PetscErrorCode PCGAMGCreateGraph(PC pc, Mat A, Mat *G) 20962d776b49SBarry Smith { 20972d776b49SBarry Smith PC_MG *mg = (PC_MG *)pc->data; 20982d776b49SBarry Smith PC_GAMG *pc_gamg = (PC_GAMG *)mg->innerctx; 20992d776b49SBarry Smith 21002d776b49SBarry Smith PetscFunctionBegin; 21012d776b49SBarry Smith PetscCall(pc_gamg->ops->creategraph(pc, A, G)); 21023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 21032d776b49SBarry Smith } 2104