15b89ad90SMark F. Adams /* 20cd22d39SHong Zhang GAMG geometric-algebric multigrid PC - Mark Adams 2011 35b89ad90SMark F. Adams */ 4af0996ceSBarry Smith #include <petsc/private/matimpl.h> 5389730f3SMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h> /*I "petscpc.h" I*/ 65b42dca8SJed Brown #include <../src/ksp/pc/impls/bjacobi/bjacobi.h> /* Hack to access same_local_solves */ 718c3aa7eSMark #include <../src/ksp/ksp/impls/cheby/chebyshevimpl.h> /*I "petscksp.h" I*/ 8f96513f1SMatthew G Knepley 9c9567895SMark #if defined(PETSC_HAVE_CUDA) 10c9567895SMark #include <cuda_runtime.h> 11c9567895SMark #endif 12c9567895SMark 13c9567895SMark #if defined(PETSC_HAVE_HIP) 14c9567895SMark #include <hip/hip_runtime.h> 15c9567895SMark #endif 16c9567895SMark 170cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 180cbbd2e1SMark F. Adams PetscLogEvent petsc_gamg_setup_events[NUM_SET]; 19b4fbaa2aSMark F. Adams #endif 200cbbd2e1SMark F. Adams 210cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 22fd1112cbSBarry Smith PetscLogEvent PC_GAMGGraph_AGG; 23fd1112cbSBarry Smith PetscLogEvent PC_GAMGGraph_GEO; 240cbbd2e1SMark F. Adams PetscLogEvent PC_GAMGCoarsen_AGG; 250cbbd2e1SMark F. Adams PetscLogEvent PC_GAMGCoarsen_GEO; 260cbbd2e1SMark F. Adams PetscLogEvent PC_GAMGProlongator_AGG; 270cbbd2e1SMark F. Adams PetscLogEvent PC_GAMGProlongator_GEO; 28fd1112cbSBarry Smith PetscLogEvent PC_GAMGOptProlongator_AGG; 290cbbd2e1SMark F. Adams #endif 300cbbd2e1SMark F. Adams 31b8fd24d8SMark F. Adams /* #define GAMG_STAGES */ 320cbbd2e1SMark F. Adams #if (defined PETSC_GAMG_USE_LOG && defined GAMG_STAGES) 3318c3aa7eSMark static PetscLogStage gamg_stages[PETSC_MG_MAXLEVELS]; 34b4fbaa2aSMark F. Adams #endif 35f96513f1SMatthew G Knepley 360a545947SLisandro Dalcin static PetscFunctionList GAMGList = NULL; 373e3471ccSMark Adams static PetscBool PCGAMGPackageInitialized; 389d5b6da9SMark F. Adams 39d3d6bff4SMark F. Adams /* ----------------------------------------------------------------------------- */ 40d3d6bff4SMark F. Adams PetscErrorCode PCReset_GAMG(PC pc) 41d3d6bff4SMark F. Adams { 4218c3aa7eSMark PetscErrorCode ierr, level; 43d3d6bff4SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 44d3d6bff4SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 45d3d6bff4SMark F. Adams 46d3d6bff4SMark F. Adams PetscFunctionBegin; 4722a233eaSStefano Zampini ierr = PetscFree(pc_gamg->data);CHKERRQ(ierr); 481c1aac46SBarry Smith pc_gamg->data_sz = 0; 49878e152fSMark F. Adams ierr = PetscFree(pc_gamg->orig_data);CHKERRQ(ierr); 5018c3aa7eSMark for (level = 0; level < PETSC_MG_MAXLEVELS ; level++) { 5118c3aa7eSMark mg->min_eigen_DinvA[level] = 0; 5218c3aa7eSMark mg->max_eigen_DinvA[level] = 0; 5318c3aa7eSMark } 5418c3aa7eSMark pc_gamg->emin = 0; 5518c3aa7eSMark pc_gamg->emax = 0; 56a2f3521dSMark F. Adams PetscFunctionReturn(0); 57a2f3521dSMark F. Adams } 58a2f3521dSMark F. Adams 595b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */ 605b89ad90SMark F. Adams /* 61c238b0ebSToby Isaac PCGAMGCreateLevel_GAMG: create coarse op with RAP. repartition and/or reduce number 62a147abb0SMark F. Adams of active processors. 635b89ad90SMark F. Adams 645b89ad90SMark F. Adams Input Parameter: 65a2f3521dSMark F. Adams . pc - parameters + side effect: coarse data in 'pc_gamg->data' and 66a2f3521dSMark F. Adams 'pc_gamg->data_sz' are changed via repartitioning/reduction. 679d5b6da9SMark F. Adams . Amat_fine - matrix on this fine (k) level 68c5bfad50SMark F. Adams . cr_bs - coarse block size 693530afc2SMark F. Adams In/Output Parameter: 70a2f3521dSMark F. Adams . a_P_inout - prolongation operator to the next level (k-->k-1) 71afc97cdcSMark F. Adams . a_nactive_proc - number of active procs 7211e60469SMark F. Adams Output Parameter: 733530afc2SMark F. Adams . a_Amat_crs - coarse matrix that is created (k-1) 745b89ad90SMark F. Adams */ 755cb416c2SMark F. Adams 76171cca9aSMark Adams static PetscErrorCode PCGAMGCreateLevel_GAMG(PC pc,Mat Amat_fine,PetscInt cr_bs,Mat *a_P_inout,Mat *a_Amat_crs,PetscMPIInt *a_nactive_proc,IS * Pcolumnperm, PetscBool is_last) 775b89ad90SMark F. Adams { 78a2f3521dSMark F. Adams PetscErrorCode ierr; 799d5b6da9SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 80486a8d0bSJed Brown PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 81a2f3521dSMark F. Adams Mat Cmat,Pold=*a_P_inout; 823b4367a7SBarry Smith MPI_Comm comm; 83c5df96a5SBarry Smith PetscMPIInt rank,size,new_size,nactive=*a_nactive_proc; 843ae0bb68SMark Adams PetscInt ncrs_eq,ncrs,f_bs; 855b89ad90SMark F. Adams 865b89ad90SMark F. Adams PetscFunctionBegin; 873b4367a7SBarry Smith ierr = PetscObjectGetComm((PetscObject)Amat_fine,&comm);CHKERRQ(ierr); 88ffc4695bSBarry Smith ierr = MPI_Comm_rank(comm, &rank);CHKERRMPI(ierr); 89ffc4695bSBarry Smith ierr = MPI_Comm_size(comm, &size);CHKERRMPI(ierr); 90c5bfad50SMark F. Adams ierr = MatGetBlockSize(Amat_fine, &f_bs);CHKERRQ(ierr); 919d5b6da9SMark F. Adams ierr = MatPtAP(Amat_fine, Pold, MAT_INITIAL_MATRIX, 2.0, &Cmat);CHKERRQ(ierr); 92038e3b61SMark F. Adams 93ce7c7f2fSMark Adams if (Pcolumnperm) *Pcolumnperm = NULL; 94ce7c7f2fSMark Adams 953ae0bb68SMark Adams /* set 'ncrs' (nodes), 'ncrs_eq' (equations)*/ 960298fd71SBarry Smith ierr = MatGetLocalSize(Cmat, &ncrs_eq, NULL);CHKERRQ(ierr); 973ae0bb68SMark Adams if (pc_gamg->data_cell_rows>0) { 983ae0bb68SMark Adams ncrs = pc_gamg->data_sz/pc_gamg->data_cell_cols/pc_gamg->data_cell_rows; 9973911c69SBarry Smith } else { 1003ae0bb68SMark Adams PetscInt bs; 1013ae0bb68SMark Adams ierr = MatGetBlockSize(Cmat, &bs);CHKERRQ(ierr); 1023ae0bb68SMark Adams ncrs = ncrs_eq/bs; 1033ae0bb68SMark Adams } 104c5df96a5SBarry Smith /* get number of PEs to make active 'new_size', reduce, can be any integer 1-P */ 105c9567895SMark if (pc_gamg->level_reduction_factors[pc_gamg->current_level] == 0 && PetscDefined(HAVE_CUDA) && pc_gamg->current_level==0) { /* 0 turns reducing to 1 process/device on; do for HIP, etc. */ 106c9567895SMark #if defined(PETSC_HAVE_CUDA) 107c9567895SMark PetscShmComm pshmcomm; 108c9567895SMark PetscMPIInt locrank; 109c9567895SMark MPI_Comm loccomm; 110c9567895SMark PetscInt s_nnodes,r_nnodes, new_new_size; 111c9567895SMark cudaError_t cerr; 112c9567895SMark int devCount; 113c9567895SMark ierr = PetscShmCommGet(comm,&pshmcomm);CHKERRQ(ierr); 114c9567895SMark ierr = PetscShmCommGetMpiShmComm(pshmcomm,&loccomm);CHKERRQ(ierr); 115c9567895SMark ierr = MPI_Comm_rank(loccomm, &locrank);CHKERRQ(ierr); 116c9567895SMark s_nnodes = !locrank; 117c9567895SMark ierr = MPI_Allreduce(&s_nnodes,&r_nnodes,1,MPIU_INT,MPI_SUM,comm);CHKERRQ(ierr); 118c9567895SMark if (size%r_nnodes) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"odd number of nodes np=%D nnodes%D",size,r_nnodes); 119c9567895SMark devCount = 0; 120c9567895SMark cerr = cudaGetDeviceCount(&devCount); 121c9567895SMark cudaGetLastError(); /* Reset the last error */ 122c9567895SMark if (cerr == cudaSuccess && devCount >= 1) { /* There are devices, else go to heuristic */ 123c9567895SMark new_new_size = r_nnodes * devCount; 124c9567895SMark new_size = new_new_size; 125c9567895SMark ierr = PetscInfo5(pc,"Fine grid with Cuda. %D nodes. Change new active set size %D --> %D (devCount=%D #nodes=%D)\n",r_nnodes,nactive,new_size,devCount,r_nnodes);CHKERRQ(ierr); 126c9567895SMark } else { 127c9567895SMark ierr = PetscInfo(pc,"With Cuda but no device. Use heuristics.");CHKERRQ(ierr); 128c9567895SMark goto HEURISTIC; 129c9567895SMark } 130c9567895SMark #else 131c9567895SMark SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"should not be here"); 132c9567895SMark #endif 133c9567895SMark } else if (pc_gamg->level_reduction_factors[pc_gamg->current_level] > 0) { 134c9567895SMark if (nactive%pc_gamg->level_reduction_factors[pc_gamg->current_level]) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"odd number of active process %D wrt reduction factor %D",nactive,pc_gamg->level_reduction_factors[pc_gamg->current_level]); 135c9567895SMark new_size = nactive/pc_gamg->level_reduction_factors[pc_gamg->current_level]; 136c9567895SMark ierr = PetscInfo3(pc,"Manually setting reduction to %D active processes (%D/%D)\n",new_size,nactive,pc_gamg->level_reduction_factors[pc_gamg->current_level]);CHKERRQ(ierr); 137c9567895SMark } else if (is_last && !pc_gamg->use_parallel_coarse_grid_solver) { 138c9567895SMark new_size = 1; 139*8abdc6daSStefano Zampini ierr = PetscInfo1(pc,"Force coarsest grid reduction to %D active processes\n",new_size);CHKERRQ(ierr); 140c9567895SMark } else { 141472110cdSMark F. Adams PetscInt ncrs_eq_glob; 142c9567895SMark #if defined(PETSC_HAVE_CUDA) 143c9567895SMark HEURISTIC: 144c9567895SMark #endif 1450298fd71SBarry Smith ierr = MatGetSize(Cmat, &ncrs_eq_glob, NULL);CHKERRQ(ierr); 146a90e85d9SMark Adams new_size = (PetscMPIInt)((float)ncrs_eq_glob/(float)pc_gamg->min_eq_proc + 0.5); /* hardwire min. number of eq/proc */ 1477f66b68fSMark Adams if (!new_size) new_size = 1; /* not likely, posible? */ 148c5df96a5SBarry Smith else if (new_size >= nactive) new_size = nactive; /* no change, rare */ 149*8abdc6daSStefano Zampini ierr = PetscInfo2(pc,"Coarse grid reduction from %D to %D active processes\n",nactive,new_size);CHKERRQ(ierr); 150a2f3521dSMark F. Adams } 1512e3501ffSMark Adams if (new_size==nactive) { 152ef3f0257SMark Adams *a_Amat_crs = Cmat; /* output - no repartitioning or reduction - could bail here */ 153ce7c7f2fSMark Adams if (new_size < size) { 154ce7c7f2fSMark Adams /* odd case where multiple coarse grids are on one processor or no coarsening ... */ 155c9567895SMark ierr = PetscInfo1(pc,"reduced grid using same number of processors (%D) as last grid (use larger coarse grid)\n",nactive);CHKERRQ(ierr); 156ce7c7f2fSMark Adams if (pc_gamg->cpu_pin_coarse_grids) { 157b470e4b4SRichard Tran Mills ierr = MatBindToCPU(*a_Amat_crs,PETSC_TRUE);CHKERRQ(ierr); 158b470e4b4SRichard Tran Mills ierr = MatBindToCPU(*a_P_inout,PETSC_TRUE);CHKERRQ(ierr); 159ce7c7f2fSMark Adams } 160ce7c7f2fSMark Adams } 161ef3f0257SMark Adams /* we know that the grid structure can be reused in MatPtAP */ 1622e3501ffSMark Adams } else { /* reduce active processors - we know that the grid structure can NOT be reused in MatPtAP */ 163192c0e8bSMark Adams PetscInt *counts,*newproc_idx,ii,jj,kk,strideNew,*tidx,ncrs_new,ncrs_eq_new,nloc_old,expand_factor=1,rfactor=1; 164885364a3SMark Adams IS is_eq_newproc,is_eq_num,is_eq_num_prim,new_eq_indices; 16571959b99SBarry Smith nloc_old = ncrs_eq/cr_bs; 16671959b99SBarry Smith if (ncrs_eq % cr_bs) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"ncrs_eq %D not divisible by cr_bs %D",ncrs_eq,cr_bs); 167ce7c7f2fSMark Adams /* get new_size and rfactor */ 168ce7c7f2fSMark Adams if (pc_gamg->layout_type==PCGAMG_LAYOUT_SPREAD || !pc_gamg->repart) { 169ce7c7f2fSMark Adams /* find factor */ 170ce7c7f2fSMark Adams if (new_size == 1) rfactor = size; /* don't modify */ 171ce7c7f2fSMark Adams else { 172ce7c7f2fSMark Adams PetscReal best_fact = 0.; 173ce7c7f2fSMark Adams jj = -1; 174ce7c7f2fSMark Adams for (kk = 1 ; kk <= size ; kk++) { 175ce7c7f2fSMark Adams if (!(size%kk)) { /* a candidate */ 176ce7c7f2fSMark Adams PetscReal nactpe = (PetscReal)size/(PetscReal)kk, fact = nactpe/(PetscReal)new_size; 177ce7c7f2fSMark Adams if (fact > 1.0) fact = 1./fact; /* keep fact < 1 */ 178ce7c7f2fSMark Adams if (fact > best_fact) { 179ce7c7f2fSMark Adams best_fact = fact; jj = kk; 180ce7c7f2fSMark Adams } 181ce7c7f2fSMark Adams } 182ce7c7f2fSMark Adams } 183ce7c7f2fSMark Adams if (jj != -1) rfactor = jj; 184ce7c7f2fSMark Adams else rfactor = 1; /* a prime */ 185ce7c7f2fSMark Adams if (pc_gamg->layout_type == PCGAMG_LAYOUT_COMPACT) expand_factor = 1; 186ce7c7f2fSMark Adams else expand_factor = rfactor; 187ce7c7f2fSMark Adams } 188ce7c7f2fSMark Adams new_size = size/rfactor; /* make new size one that is factor */ 1894cdfd227SMark if (new_size==nactive) { /* no repartitioning or reduction, bail out because nested here (rare) */ 1904cdfd227SMark *a_Amat_crs = Cmat; 191c9567895SMark ierr = PetscInfo2(pc,"Finding factorable processor set stopped reduction: new_size=%D, neq(loc)=%D\n",new_size,ncrs_eq);CHKERRQ(ierr); 192ce7c7f2fSMark Adams PetscFunctionReturn(0); 193ce7c7f2fSMark Adams } 194ce7c7f2fSMark Adams } 1954cdfd227SMark #if defined PETSC_GAMG_USE_LOG 1964cdfd227SMark ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET12],0,0,0,0);CHKERRQ(ierr); 1974cdfd227SMark #endif 198a2f3521dSMark F. Adams /* make 'is_eq_newproc' */ 199785e854fSJed Brown ierr = PetscMalloc1(size, &counts);CHKERRQ(ierr); 2002e3501ffSMark Adams if (pc_gamg->repart) { 201a2f3521dSMark F. Adams /* Repartition Cmat_{k} and move colums of P^{k}_{k-1} and coordinates of primal part accordingly */ 2025a9b9e01SMark F. Adams Mat adj; 203c9567895SMark ierr = PetscInfo4(pc,"Repartition: size (active): %D --> %D, %D local equations, using %s process layout\n",*a_nactive_proc, new_size, ncrs_eq, (pc_gamg->layout_type==PCGAMG_LAYOUT_COMPACT) ? "compact" : "spread");CHKERRQ(ierr); 204a2f3521dSMark F. Adams /* get 'adj' */ 205c5bfad50SMark F. Adams if (cr_bs == 1) { 206038e3b61SMark F. Adams ierr = MatConvert(Cmat, MATMPIADJ, MAT_INITIAL_MATRIX, &adj);CHKERRQ(ierr); 207806fa848SBarry Smith } else { 208a2f3521dSMark F. Adams /* make a scalar matrix to partition (no Stokes here) */ 209eb07cef2SMark F. Adams Mat tMat; 210a2f3521dSMark F. Adams PetscInt Istart_crs,Iend_crs,ncols,jj,Ii; 211b4fbaa2aSMark F. Adams const PetscScalar *vals; 212b4fbaa2aSMark F. Adams const PetscInt *idx; 213a2f3521dSMark F. Adams PetscInt *d_nnz, *o_nnz, M, N; 21439d09545SMark Adams static PetscInt llev = 0; /* ugly but just used for debugging */ 215d9558ea9SBarry Smith MatType mtype; 216b4fbaa2aSMark F. Adams 217e632b94dSBarry Smith ierr = PetscMalloc2(ncrs, &d_nnz,ncrs, &o_nnz);CHKERRQ(ierr); 218a2f3521dSMark F. Adams ierr = MatGetOwnershipRange(Cmat, &Istart_crs, &Iend_crs);CHKERRQ(ierr); 219a2f3521dSMark F. Adams ierr = MatGetSize(Cmat, &M, &N);CHKERRQ(ierr); 220c5bfad50SMark F. Adams for (Ii = Istart_crs, jj = 0; Ii < Iend_crs; Ii += cr_bs, jj++) { 2210a545947SLisandro Dalcin ierr = MatGetRow(Cmat,Ii,&ncols,NULL,NULL);CHKERRQ(ierr); 222c5bfad50SMark F. Adams d_nnz[jj] = ncols/cr_bs; 223c5bfad50SMark F. Adams o_nnz[jj] = ncols/cr_bs; 2240a545947SLisandro Dalcin ierr = MatRestoreRow(Cmat,Ii,&ncols,NULL,NULL);CHKERRQ(ierr); 2253ae0bb68SMark Adams if (d_nnz[jj] > ncrs) d_nnz[jj] = ncrs; 2263ae0bb68SMark Adams if (o_nnz[jj] > (M/cr_bs-ncrs)) o_nnz[jj] = M/cr_bs-ncrs; 22758471d46SMark F. Adams } 2286876a03eSMark F. Adams 229d9558ea9SBarry Smith ierr = MatGetType(Amat_fine,&mtype);CHKERRQ(ierr); 2303b4367a7SBarry Smith ierr = MatCreate(comm, &tMat);CHKERRQ(ierr); 2313ae0bb68SMark Adams ierr = MatSetSizes(tMat, ncrs, ncrs,PETSC_DETERMINE, PETSC_DETERMINE);CHKERRQ(ierr); 232d9558ea9SBarry Smith ierr = MatSetType(tMat,mtype);CHKERRQ(ierr); 233a2f3521dSMark F. Adams ierr = MatSeqAIJSetPreallocation(tMat,0,d_nnz);CHKERRQ(ierr); 234a2f3521dSMark F. Adams ierr = MatMPIAIJSetPreallocation(tMat,0,d_nnz,0,o_nnz);CHKERRQ(ierr); 235e632b94dSBarry Smith ierr = PetscFree2(d_nnz,o_nnz);CHKERRQ(ierr); 236eb07cef2SMark F. Adams 237a2f3521dSMark F. Adams for (ii = Istart_crs; ii < Iend_crs; ii++) { 238c5bfad50SMark F. Adams PetscInt dest_row = ii/cr_bs; 23922063be5SMark F. Adams ierr = MatGetRow(Cmat,ii,&ncols,&idx,&vals);CHKERRQ(ierr); 240eb07cef2SMark F. Adams for (jj = 0; jj < ncols; jj++) { 241c5bfad50SMark F. Adams PetscInt dest_col = idx[jj]/cr_bs; 242eb07cef2SMark F. Adams PetscScalar v = 1.0; 243eb07cef2SMark F. Adams ierr = MatSetValues(tMat,1,&dest_row,1,&dest_col,&v,ADD_VALUES);CHKERRQ(ierr); 244eb07cef2SMark F. Adams } 24522063be5SMark F. Adams ierr = MatRestoreRow(Cmat,ii,&ncols,&idx,&vals);CHKERRQ(ierr); 246eb07cef2SMark F. Adams } 247eb07cef2SMark F. Adams ierr = MatAssemblyBegin(tMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 248eb07cef2SMark F. Adams ierr = MatAssemblyEnd(tMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 249eb07cef2SMark F. Adams 250b4fbaa2aSMark F. Adams if (llev++ == -1) { 251b4fbaa2aSMark F. Adams PetscViewer viewer; char fname[32]; 2528caf3d72SBarry Smith ierr = PetscSNPrintf(fname,sizeof(fname),"part_mat_%D.mat",llev);CHKERRQ(ierr); 2533b4367a7SBarry Smith PetscViewerBinaryOpen(comm,fname,FILE_MODE_WRITE,&viewer); 254b4fbaa2aSMark F. Adams ierr = MatView(tMat, viewer);CHKERRQ(ierr); 2553bf036e2SBarry Smith ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr); 256b4fbaa2aSMark F. Adams } 257eb07cef2SMark F. Adams ierr = MatConvert(tMat, MATMPIADJ, MAT_INITIAL_MATRIX, &adj);CHKERRQ(ierr); 258eb07cef2SMark F. Adams ierr = MatDestroy(&tMat);CHKERRQ(ierr); 259a2f3521dSMark F. Adams } /* create 'adj' */ 260f150b916SMark F. Adams 261a2f3521dSMark F. Adams { /* partition: get newproc_idx */ 2625a9b9e01SMark F. Adams char prefix[256]; 2635a9b9e01SMark F. Adams const char *pcpre; 264b4fbaa2aSMark F. Adams const PetscInt *is_idx; 265b4fbaa2aSMark F. Adams MatPartitioning mpart; 266a4b7d37bSMark F. Adams IS proc_is; 2672f03bc48SMark F. Adams 2683b4367a7SBarry Smith ierr = MatPartitioningCreate(comm, &mpart);CHKERRQ(ierr); 2695ef31b24SMark F. Adams ierr = MatPartitioningSetAdjacency(mpart, adj);CHKERRQ(ierr); 2709d5b6da9SMark F. Adams ierr = PCGetOptionsPrefix(pc, &pcpre);CHKERRQ(ierr); 2718caf3d72SBarry Smith ierr = PetscSNPrintf(prefix,sizeof(prefix),"%spc_gamg_",pcpre ? pcpre : "");CHKERRQ(ierr); 27259a0be82SJed Brown ierr = PetscObjectSetOptionsPrefix((PetscObject)mpart,prefix);CHKERRQ(ierr); 27311e60469SMark F. Adams ierr = MatPartitioningSetFromOptions(mpart);CHKERRQ(ierr); 274c5df96a5SBarry Smith ierr = MatPartitioningSetNParts(mpart, new_size);CHKERRQ(ierr); 275a4b7d37bSMark F. Adams ierr = MatPartitioningApply(mpart, &proc_is);CHKERRQ(ierr); 27611e60469SMark F. Adams ierr = MatPartitioningDestroy(&mpart);CHKERRQ(ierr); 2775a9b9e01SMark F. Adams 2785ef31b24SMark F. Adams /* collect IS info */ 279785e854fSJed Brown ierr = PetscMalloc1(ncrs_eq, &newproc_idx);CHKERRQ(ierr); 280a4b7d37bSMark F. Adams ierr = ISGetIndices(proc_is, &is_idx);CHKERRQ(ierr); 281a2f3521dSMark F. Adams for (kk = jj = 0 ; kk < nloc_old ; kk++) { 282c5bfad50SMark F. Adams for (ii = 0 ; ii < cr_bs ; ii++, jj++) { 283ce7c7f2fSMark Adams newproc_idx[jj] = is_idx[kk] * expand_factor; /* distribution */ 284eb07cef2SMark F. Adams } 2855ef31b24SMark F. Adams } 286a4b7d37bSMark F. Adams ierr = ISRestoreIndices(proc_is, &is_idx);CHKERRQ(ierr); 287a4b7d37bSMark F. Adams ierr = ISDestroy(&proc_is);CHKERRQ(ierr); 2885ef31b24SMark F. Adams } 2895ef31b24SMark F. Adams ierr = MatDestroy(&adj);CHKERRQ(ierr); 2905a9b9e01SMark F. Adams 2913b4367a7SBarry Smith ierr = ISCreateGeneral(comm, ncrs_eq, newproc_idx, PETSC_COPY_VALUES, &is_eq_newproc);CHKERRQ(ierr); 2928263b398SMark F. Adams ierr = PetscFree(newproc_idx);CHKERRQ(ierr); 29331cb4603SMark Adams } else { /* simple aggregation of parts -- 'is_eq_newproc' */ 294ce7c7f2fSMark Adams PetscInt targetPE; 2954cdfd227SMark if (new_size==nactive) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"new_size==nactive. Should not happen"); 296302440fdSBarry Smith ierr = PetscInfo1(pc,"Number of equations (loc) %D with simple aggregation\n",ncrs_eq);CHKERRQ(ierr); 297ce7c7f2fSMark Adams targetPE = (rank/rfactor)*expand_factor; 2983b4367a7SBarry Smith ierr = ISCreateStride(comm, ncrs_eq, targetPE, 0, &is_eq_newproc);CHKERRQ(ierr); 299a2f3521dSMark F. Adams } /* end simple 'is_eq_newproc' */ 300e33ef3b1SMark F. Adams 30111e60469SMark F. Adams /* 302a2f3521dSMark F. Adams Create an index set from the is_eq_newproc index set to indicate the mapping TO 30311e60469SMark F. Adams */ 304a2f3521dSMark F. Adams ierr = ISPartitioningToNumbering(is_eq_newproc, &is_eq_num);CHKERRQ(ierr); 3057700e67bSMark Adams is_eq_num_prim = is_eq_num; 30611e60469SMark F. Adams /* 307a2f3521dSMark F. Adams Determine how many equations/vertices are assigned to each processor 30811e60469SMark F. Adams */ 309c5df96a5SBarry Smith ierr = ISPartitioningCount(is_eq_newproc, size, counts);CHKERRQ(ierr); 310c5df96a5SBarry Smith ncrs_eq_new = counts[rank]; 311a2f3521dSMark F. Adams ierr = ISDestroy(&is_eq_newproc);CHKERRQ(ierr); 312ce7c7f2fSMark Adams ncrs_new = ncrs_eq_new/cr_bs; 313a2f3521dSMark F. Adams 314a2f3521dSMark F. Adams ierr = PetscFree(counts);CHKERRQ(ierr); 315885364a3SMark Adams /* data movement scope -- this could be moved to subclasses so that we don't try to cram all auxilary data into some complex abstracted thing */ 316885364a3SMark Adams { 317885364a3SMark Adams Vec src_crd, dest_crd; 318885364a3SMark Adams const PetscInt *idx,ndata_rows=pc_gamg->data_cell_rows,ndata_cols=pc_gamg->data_cell_cols,node_data_sz=ndata_rows*ndata_cols; 319885364a3SMark Adams VecScatter vecscat; 320885364a3SMark Adams PetscScalar *array; 321885364a3SMark Adams IS isscat; 322a2f3521dSMark F. Adams /* move data (for primal equations only) */ 32322063be5SMark F. Adams /* Create a vector to contain the newly ordered element information */ 3243b4367a7SBarry Smith ierr = VecCreate(comm, &dest_crd);CHKERRQ(ierr); 3253ae0bb68SMark Adams ierr = VecSetSizes(dest_crd, node_data_sz*ncrs_new, PETSC_DECIDE);CHKERRQ(ierr); 326c0dedaeaSBarry Smith ierr = VecSetType(dest_crd,VECSTANDARD);CHKERRQ(ierr); /* this is needed! */ 32711e60469SMark F. Adams /* 3289d5b6da9SMark F. Adams There are 'ndata_rows*ndata_cols' data items per node, (one can think of the vectors of having 329c5bfad50SMark F. Adams a block size of ...). Note, ISs are expanded into equation space by 'cr_bs'. 33011e60469SMark F. Adams */ 331854ce69bSBarry Smith ierr = PetscMalloc1(ncrs*node_data_sz, &tidx);CHKERRQ(ierr); 332a2f3521dSMark F. Adams ierr = ISGetIndices(is_eq_num_prim, &idx);CHKERRQ(ierr); 3333ae0bb68SMark Adams for (ii=0,jj=0; ii<ncrs; ii++) { 334c5bfad50SMark F. Adams PetscInt id = idx[ii*cr_bs]/cr_bs; /* get node back */ 335a2f3521dSMark F. Adams for (kk=0; kk<node_data_sz; kk++, jj++) tidx[jj] = id*node_data_sz + kk; 33611e60469SMark F. Adams } 337a2f3521dSMark F. Adams ierr = ISRestoreIndices(is_eq_num_prim, &idx);CHKERRQ(ierr); 3383ae0bb68SMark Adams ierr = ISCreateGeneral(comm, node_data_sz*ncrs, tidx, PETSC_COPY_VALUES, &isscat);CHKERRQ(ierr); 33992a756f0SMark F. Adams ierr = PetscFree(tidx);CHKERRQ(ierr); 34011e60469SMark F. Adams /* 34111e60469SMark F. Adams Create a vector to contain the original vertex information for each element 34211e60469SMark F. Adams */ 3433ae0bb68SMark Adams ierr = VecCreateSeq(PETSC_COMM_SELF, node_data_sz*ncrs, &src_crd);CHKERRQ(ierr); 3449d5b6da9SMark F. Adams for (jj=0; jj<ndata_cols; jj++) { 3453ae0bb68SMark Adams const PetscInt stride0=ncrs*pc_gamg->data_cell_rows; 3463ae0bb68SMark Adams for (ii=0; ii<ncrs; ii++) { 3479d5b6da9SMark F. Adams for (kk=0; kk<ndata_rows; kk++) { 348a2f3521dSMark F. Adams PetscInt ix = ii*ndata_rows + kk + jj*stride0, jx = ii*node_data_sz + kk*ndata_cols + jj; 349c8b0795cSMark F. Adams PetscScalar tt = (PetscScalar)pc_gamg->data[ix]; 350676e1743SMark F. Adams ierr = VecSetValues(src_crd, 1, &jx, &tt, INSERT_VALUES);CHKERRQ(ierr); 351d3d6bff4SMark F. Adams } 352038e3b61SMark F. Adams } 353eb07cef2SMark F. Adams } 354eb07cef2SMark F. Adams ierr = VecAssemblyBegin(src_crd);CHKERRQ(ierr); 355eb07cef2SMark F. Adams ierr = VecAssemblyEnd(src_crd);CHKERRQ(ierr); 35611e60469SMark F. Adams /* 35711e60469SMark F. Adams Scatter the element vertex information (still in the original vertex ordering) 35811e60469SMark F. Adams to the correct processor 35911e60469SMark F. Adams */ 3609448b7f1SJunchao Zhang ierr = VecScatterCreate(src_crd, NULL, dest_crd, isscat, &vecscat);CHKERRQ(ierr); 36111e60469SMark F. Adams ierr = ISDestroy(&isscat);CHKERRQ(ierr); 36211e60469SMark F. Adams ierr = VecScatterBegin(vecscat,src_crd,dest_crd,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 36311e60469SMark F. Adams ierr = VecScatterEnd(vecscat,src_crd,dest_crd,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 36411e60469SMark F. Adams ierr = VecScatterDestroy(&vecscat);CHKERRQ(ierr); 36511e60469SMark F. Adams ierr = VecDestroy(&src_crd);CHKERRQ(ierr); 36611e60469SMark F. Adams /* 36711e60469SMark F. Adams Put the element vertex data into a new allocation of the gdata->ele 36811e60469SMark F. Adams */ 369c8b0795cSMark F. Adams ierr = PetscFree(pc_gamg->data);CHKERRQ(ierr); 370578f55a3SPeter Brune ierr = PetscMalloc1(node_data_sz*ncrs_new, &pc_gamg->data);CHKERRQ(ierr); 3712fa5cd67SKarl Rupp 3723ae0bb68SMark Adams pc_gamg->data_sz = node_data_sz*ncrs_new; 3733ae0bb68SMark Adams strideNew = ncrs_new*ndata_rows; 3742fa5cd67SKarl Rupp 37511e60469SMark F. Adams ierr = VecGetArray(dest_crd, &array);CHKERRQ(ierr); 3769d5b6da9SMark F. Adams for (jj=0; jj<ndata_cols; jj++) { 3773ae0bb68SMark Adams for (ii=0; ii<ncrs_new; ii++) { 3789d5b6da9SMark F. Adams for (kk=0; kk<ndata_rows; kk++) { 379a2f3521dSMark F. Adams PetscInt ix = ii*ndata_rows + kk + jj*strideNew, jx = ii*node_data_sz + kk*ndata_cols + jj; 380c8b0795cSMark F. Adams pc_gamg->data[ix] = PetscRealPart(array[jx]); 381d3d6bff4SMark F. Adams } 382038e3b61SMark F. Adams } 383038e3b61SMark F. Adams } 38411e60469SMark F. Adams ierr = VecRestoreArray(dest_crd, &array);CHKERRQ(ierr); 38511e60469SMark F. Adams ierr = VecDestroy(&dest_crd);CHKERRQ(ierr); 386885364a3SMark Adams } 387a2f3521dSMark F. Adams /* move A and P (columns) with new layout */ 3880cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 3890cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET13],0,0,0,0);CHKERRQ(ierr); 390ed3f9983SMark F. Adams #endif 39111e60469SMark F. Adams /* 3927dae84e0SHong Zhang Invert for MatCreateSubMatrix 39311e60469SMark F. Adams */ 394a2f3521dSMark F. Adams ierr = ISInvertPermutation(is_eq_num, ncrs_eq_new, &new_eq_indices);CHKERRQ(ierr); 395a2f3521dSMark F. Adams ierr = ISSort(new_eq_indices);CHKERRQ(ierr); /* is this needed? */ 396c5bfad50SMark F. Adams ierr = ISSetBlockSize(new_eq_indices, cr_bs);CHKERRQ(ierr); 397a2f3521dSMark F. Adams if (is_eq_num != is_eq_num_prim) { 398a2f3521dSMark F. Adams ierr = ISDestroy(&is_eq_num_prim);CHKERRQ(ierr); /* could be same as 'is_eq_num' */ 399a2f3521dSMark F. Adams } 4003cb8563fSToby Isaac if (Pcolumnperm) { 4013cb8563fSToby Isaac ierr = PetscObjectReference((PetscObject)new_eq_indices);CHKERRQ(ierr); 4023cb8563fSToby Isaac *Pcolumnperm = new_eq_indices; 4033cb8563fSToby Isaac } 404a2f3521dSMark F. Adams ierr = ISDestroy(&is_eq_num);CHKERRQ(ierr); 4050cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 4060cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET13],0,0,0,0);CHKERRQ(ierr); 4070cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET14],0,0,0,0);CHKERRQ(ierr); 408ed3f9983SMark F. Adams #endif 409a2f3521dSMark F. Adams /* 'a_Amat_crs' output */ 410a2f3521dSMark F. Adams { 411a2f3521dSMark F. Adams Mat mat; 4127dae84e0SHong Zhang ierr = MatCreateSubMatrix(Cmat, new_eq_indices, new_eq_indices, MAT_INITIAL_MATRIX, &mat);CHKERRQ(ierr); 413a2f3521dSMark F. Adams *a_Amat_crs = mat; 414a2f3521dSMark F. Adams } 415038e3b61SMark F. Adams ierr = MatDestroy(&Cmat);CHKERRQ(ierr); 416a2f3521dSMark F. Adams 4170cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 4180cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET14],0,0,0,0);CHKERRQ(ierr); 419ed3f9983SMark F. Adams #endif 42011e60469SMark F. Adams /* prolongator */ 42111e60469SMark F. Adams { 42211e60469SMark F. Adams IS findices; 423a2f3521dSMark F. Adams PetscInt Istart,Iend; 424a2f3521dSMark F. Adams Mat Pnew; 42562294041SBarry Smith 426a2f3521dSMark F. Adams ierr = MatGetOwnershipRange(Pold, &Istart, &Iend);CHKERRQ(ierr); 4270cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 4280cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET15],0,0,0,0);CHKERRQ(ierr); 429ed3f9983SMark F. Adams #endif 4303b4367a7SBarry Smith ierr = ISCreateStride(comm,Iend-Istart,Istart,1,&findices);CHKERRQ(ierr); 431c5bfad50SMark F. Adams ierr = ISSetBlockSize(findices,f_bs);CHKERRQ(ierr); 4327dae84e0SHong Zhang ierr = MatCreateSubMatrix(Pold, findices, new_eq_indices, MAT_INITIAL_MATRIX, &Pnew);CHKERRQ(ierr); 43311e60469SMark F. Adams ierr = ISDestroy(&findices);CHKERRQ(ierr); 434c5bfad50SMark F. Adams 4350cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 4360cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET15],0,0,0,0);CHKERRQ(ierr); 437ed3f9983SMark F. Adams #endif 4383530afc2SMark F. Adams ierr = MatDestroy(a_P_inout);CHKERRQ(ierr); 439a2f3521dSMark F. Adams 440a2f3521dSMark F. Adams /* output - repartitioned */ 441a2f3521dSMark F. Adams *a_P_inout = Pnew; 442e33ef3b1SMark F. Adams } 443a2f3521dSMark F. Adams ierr = ISDestroy(&new_eq_indices);CHKERRQ(ierr); 4445b89ad90SMark F. Adams 445c5df96a5SBarry Smith *a_nactive_proc = new_size; /* output */ 446ce7c7f2fSMark Adams 447ce7c7f2fSMark Adams /* pinning on reduced grids, not a bad heuristic and optimization gets folded into process reduction optimization */ 448ce7c7f2fSMark Adams if (pc_gamg->cpu_pin_coarse_grids) { 449ce7c7f2fSMark Adams #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 4508bca76a6SMark Adams static PetscInt llev = 2; 45139d09545SMark Adams ierr = PetscInfo1(pc,"Pinning level %D to the CPU\n",llev++);CHKERRQ(ierr); 452ce7c7f2fSMark Adams #endif 453b470e4b4SRichard Tran Mills ierr = MatBindToCPU(*a_Amat_crs,PETSC_TRUE);CHKERRQ(ierr); 454b470e4b4SRichard Tran Mills ierr = MatBindToCPU(*a_P_inout,PETSC_TRUE);CHKERRQ(ierr); 455ce7c7f2fSMark Adams if (1) { /* lvec is created, need to pin it, this is done in MatSetUpMultiply_MPIAIJ. Hack */ 456ce7c7f2fSMark Adams Mat A = *a_Amat_crs, P = *a_P_inout; 457ce7c7f2fSMark Adams PetscMPIInt size; 458ffc4695bSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&size);CHKERRMPI(ierr); 459ce7c7f2fSMark Adams if (size > 1) { 460ce7c7f2fSMark Adams Mat_MPIAIJ *a = (Mat_MPIAIJ*)A->data, *p = (Mat_MPIAIJ*)P->data; 461b470e4b4SRichard Tran Mills ierr = VecBindToCPU(a->lvec,PETSC_TRUE);CHKERRQ(ierr); 462b470e4b4SRichard Tran Mills ierr = VecBindToCPU(p->lvec,PETSC_TRUE);CHKERRQ(ierr); 463ce7c7f2fSMark Adams } 464ce7c7f2fSMark Adams } 465ce7c7f2fSMark Adams } 4664cdfd227SMark #if defined PETSC_GAMG_USE_LOG 4674cdfd227SMark ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET12],0,0,0,0);CHKERRQ(ierr); 4684cdfd227SMark #endif 469a2f3521dSMark F. Adams } 4705b89ad90SMark F. Adams PetscFunctionReturn(0); 4715b89ad90SMark F. Adams } 4725b89ad90SMark F. Adams 4734b1575e2SStefano Zampini PetscErrorCode PCGAMGSquareGraph_GAMG(PC a_pc, Mat Gmat1, Mat* Gmat2) 4744b1575e2SStefano Zampini { 4754b1575e2SStefano Zampini PetscErrorCode ierr; 4764b1575e2SStefano Zampini const char *prefix; 4774b1575e2SStefano Zampini char addp[32]; 4784b1575e2SStefano Zampini PC_MG *mg = (PC_MG*)a_pc->data; 4794b1575e2SStefano Zampini PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 4804b1575e2SStefano Zampini 4814b1575e2SStefano Zampini PetscFunctionBegin; 4824b1575e2SStefano Zampini ierr = PCGetOptionsPrefix(a_pc,&prefix);CHKERRQ(ierr); 4834b1575e2SStefano Zampini ierr = PetscInfo1(a_pc,"Square Graph on level %D\n",pc_gamg->current_level+1);CHKERRQ(ierr); 484*8abdc6daSStefano Zampini #if defined(PETSC_HAVE_CUDA) 485*8abdc6daSStefano Zampini ierr = MatAIJCUSPARSESetGenerateTranspose(Gmat1,PETSC_TRUE);CHKERRQ(ierr); 486*8abdc6daSStefano Zampini #endif 4874b1575e2SStefano Zampini ierr = MatProductCreate(Gmat1,Gmat1,NULL,Gmat2);CHKERRQ(ierr); 4884b1575e2SStefano Zampini ierr = MatSetOptionsPrefix(*Gmat2,prefix);CHKERRQ(ierr); 4894b1575e2SStefano Zampini ierr = PetscSNPrintf(addp,sizeof(addp),"pc_gamg_square_%d_",pc_gamg->current_level);CHKERRQ(ierr); 4904b1575e2SStefano Zampini ierr = MatAppendOptionsPrefix(*Gmat2,addp);CHKERRQ(ierr); 49143ef1857SStefano Zampini /* TODO: if we know the matrix is symmetric we can pass MATPRODUCT_AB */ 4924b1575e2SStefano Zampini ierr = MatProductSetType(*Gmat2,MATPRODUCT_AtB);CHKERRQ(ierr); 4934b1575e2SStefano Zampini ierr = MatProductSetFromOptions(*Gmat2);CHKERRQ(ierr); 4944b1575e2SStefano Zampini ierr = MatProductSymbolic(*Gmat2);CHKERRQ(ierr); 4954b1575e2SStefano Zampini /* we only need the sparsity, cheat and tell PETSc the matrix has been assembled */ 4964b1575e2SStefano Zampini (*Gmat2)->assembled = PETSC_TRUE; 4974b1575e2SStefano Zampini PetscFunctionReturn(0); 4984b1575e2SStefano Zampini } 4994b1575e2SStefano Zampini 5005b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */ 5015b89ad90SMark F. Adams /* 5025b89ad90SMark F. Adams PCSetUp_GAMG - Prepares for the use of the GAMG preconditioner 5035b89ad90SMark F. Adams by setting data structures and options. 5045b89ad90SMark F. Adams 5055b89ad90SMark F. Adams Input Parameter: 5065b89ad90SMark F. Adams . pc - the preconditioner context 5075b89ad90SMark F. Adams 5085b89ad90SMark F. Adams */ 5099d5b6da9SMark F. Adams PetscErrorCode PCSetUp_GAMG(PC pc) 5105b89ad90SMark F. Adams { 5115b89ad90SMark F. Adams PetscErrorCode ierr; 5129d5b6da9SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 5135b89ad90SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 5142adcac29SMark F. Adams Mat Pmat = pc->pmat; 51518c3aa7eSMark PetscInt fine_level,level,level1,bs,M,N,qq,lidx,nASMBlocksArr[PETSC_MG_MAXLEVELS]; 5163b4367a7SBarry Smith MPI_Comm comm; 517c5df96a5SBarry Smith PetscMPIInt rank,size,nactivepe; 51818c3aa7eSMark Mat Aarr[PETSC_MG_MAXLEVELS],Parr[PETSC_MG_MAXLEVELS]; 51918c3aa7eSMark IS *ASMLocalIDsArr[PETSC_MG_MAXLEVELS]; 520a2f3521dSMark F. Adams PetscLogDouble nnz0=0.,nnztot=0.; 521569f4572SMark Adams MatInfo info; 522171cca9aSMark Adams PetscBool is_last = PETSC_FALSE; 5235ef31b24SMark F. Adams 5245b89ad90SMark F. Adams PetscFunctionBegin; 5253b4367a7SBarry Smith ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 526ffc4695bSBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRMPI(ierr); 527ffc4695bSBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRMPI(ierr); 528dfd5c07aSMark F. Adams 529*8abdc6daSStefano Zampini if (pc->setupcalled) { 530*8abdc6daSStefano Zampini if (!pc_gamg->reuse_prol || pc->flag == DIFFERENT_NONZERO_PATTERN) { 531878e152fSMark F. Adams /* reset everything */ 532878e152fSMark F. Adams ierr = PCReset_MG(pc);CHKERRQ(ierr); 533878e152fSMark F. Adams pc->setupcalled = 0; 534806fa848SBarry Smith } else { 53584d3f75bSMark F. Adams PC_MG_Levels **mglevels = mg->levels; 53603a628feSMark F. Adams /* just do Galerkin grids */ 53758471d46SMark F. Adams Mat B,dA,dB; 53858471d46SMark F. Adams 5399d5b6da9SMark F. Adams if (pc_gamg->Nlevels > 1) { 54058471d46SMark F. Adams /* currently only handle case where mat and pmat are the same on coarser levels */ 54123ee1639SBarry Smith ierr = KSPGetOperators(mglevels[pc_gamg->Nlevels-1]->smoothd,&dA,&dB);CHKERRQ(ierr); 54258471d46SMark F. Adams /* (re)set to get dirty flag */ 54323ee1639SBarry Smith ierr = KSPSetOperators(mglevels[pc_gamg->Nlevels-1]->smoothd,dA,dB);CHKERRQ(ierr); 54458471d46SMark F. Adams 5452fb0b348SMark F. Adams for (level=pc_gamg->Nlevels-2; level>=0; level--) { 546*8abdc6daSStefano Zampini MatReuse reuse = MAT_INITIAL_MATRIX ; 547*8abdc6daSStefano Zampini 548*8abdc6daSStefano Zampini /* matrix structure can change from repartitioning or process reduction but don't know if we have process reduction here. Should fix */ 54923ee1639SBarry Smith ierr = KSPGetOperators(mglevels[level]->smoothd,NULL,&B);CHKERRQ(ierr); 550*8abdc6daSStefano Zampini if (B->product) { 551*8abdc6daSStefano Zampini if (B->product->A == dB && B->product->B == mglevels[level+1]->interpolate) { 552*8abdc6daSStefano Zampini reuse = MAT_REUSE_MATRIX; 55303a628feSMark F. Adams } 554*8abdc6daSStefano Zampini } 555*8abdc6daSStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { ierr = MatDestroy(&mglevels[level]->A);CHKERRQ(ierr); } 556*8abdc6daSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 557*8abdc6daSStefano Zampini ierr = PetscInfo1(pc,"RAP after first solve, reuse matrix level %D\n",level);CHKERRQ(ierr); 558*8abdc6daSStefano Zampini } else { 559*8abdc6daSStefano Zampini ierr = PetscInfo1(pc,"RAP after first solve, new matrix level %D\n",level);CHKERRQ(ierr); 560*8abdc6daSStefano Zampini } 561*8abdc6daSStefano Zampini ierr = MatPtAP(dB,mglevels[level+1]->interpolate,reuse,PETSC_DEFAULT,&B);CHKERRQ(ierr); 562*8abdc6daSStefano Zampini mglevels[level]->A = B; 56323ee1639SBarry Smith ierr = KSPSetOperators(mglevels[level]->smoothd,B,B);CHKERRQ(ierr); 56458471d46SMark F. Adams dB = B; 56558471d46SMark F. Adams } 5665f8cf99dSMark F. Adams } 567d5280255SMark F. Adams 568d5280255SMark F. Adams ierr = PCSetUp_MG(pc);CHKERRQ(ierr); 56958471d46SMark F. Adams PetscFunctionReturn(0); 570eb07cef2SMark F. Adams } 571878e152fSMark F. Adams } 572f6536408SMark F. Adams 573878e152fSMark F. Adams if (!pc_gamg->data) { 574878e152fSMark F. Adams if (pc_gamg->orig_data) { 575878e152fSMark F. Adams ierr = MatGetBlockSize(Pmat, &bs);CHKERRQ(ierr); 5760298fd71SBarry Smith ierr = MatGetLocalSize(Pmat, &qq, NULL);CHKERRQ(ierr); 5772fa5cd67SKarl Rupp 578878e152fSMark F. Adams pc_gamg->data_sz = (qq/bs)*pc_gamg->orig_data_cell_rows*pc_gamg->orig_data_cell_cols; 579878e152fSMark F. Adams pc_gamg->data_cell_rows = pc_gamg->orig_data_cell_rows; 580878e152fSMark F. Adams pc_gamg->data_cell_cols = pc_gamg->orig_data_cell_cols; 5812fa5cd67SKarl Rupp 582785e854fSJed Brown ierr = PetscMalloc1(pc_gamg->data_sz, &pc_gamg->data);CHKERRQ(ierr); 583878e152fSMark F. Adams for (qq=0; qq<pc_gamg->data_sz; qq++) pc_gamg->data[qq] = pc_gamg->orig_data[qq]; 584806fa848SBarry Smith } else { 5851ab5ffc9SJed Brown if (!pc_gamg->ops->createdefaultdata) SETERRQ(comm,PETSC_ERR_PLIB,"'createdefaultdata' not set(?) need to support NULL data"); 5867700e67bSMark Adams ierr = pc_gamg->ops->createdefaultdata(pc,Pmat);CHKERRQ(ierr); 5879d5b6da9SMark F. Adams } 588878e152fSMark F. Adams } 589878e152fSMark F. Adams 590878e152fSMark F. Adams /* cache original data for reuse */ 5911c1aac46SBarry Smith if (!pc_gamg->orig_data && (PetscBool)(!pc_gamg->reuse_prol)) { 592785e854fSJed Brown ierr = PetscMalloc1(pc_gamg->data_sz, &pc_gamg->orig_data);CHKERRQ(ierr); 593878e152fSMark F. Adams for (qq=0; qq<pc_gamg->data_sz; qq++) pc_gamg->orig_data[qq] = pc_gamg->data[qq]; 594878e152fSMark F. Adams pc_gamg->orig_data_cell_rows = pc_gamg->data_cell_rows; 595878e152fSMark F. Adams pc_gamg->orig_data_cell_cols = pc_gamg->data_cell_cols; 596878e152fSMark F. Adams } 597038e3b61SMark F. Adams 598302f38e8SMark F. Adams /* get basic dims */ 599302f38e8SMark F. Adams ierr = MatGetBlockSize(Pmat, &bs);CHKERRQ(ierr); 600171cca9aSMark Adams ierr = MatGetSize(Pmat, &M, &N);CHKERRQ(ierr); 60184d3f75bSMark F. Adams 602569f4572SMark Adams ierr = MatGetInfo(Pmat,MAT_GLOBAL_SUM,&info);CHKERRQ(ierr); /* global reduction */ 603569f4572SMark Adams nnz0 = info.nz_used; 604569f4572SMark Adams nnztot = info.nz_used; 605c9567895SMark ierr = PetscInfo6(pc,"level %D) N=%D, n data rows=%D, n data cols=%D, nnz/row (ave)=%d, np=%D\n",0,M,pc_gamg->data_cell_rows,pc_gamg->data_cell_cols,(int)(nnz0/(PetscReal)M+0.5),size);CHKERRQ(ierr); 606569f4572SMark Adams 607a2f3521dSMark F. Adams /* Get A_i and R_i */ 60862294041SBarry Smith for (level=0, Aarr[0]=Pmat, nactivepe = size; level < (pc_gamg->Nlevels-1) && (!level || M>pc_gamg->coarse_eq_limit); level++) { 6099ab59c8bSMark Adams pc_gamg->current_level = level; 61018c3aa7eSMark if (level >= PETSC_MG_MAXLEVELS) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Too many levels %D",level); 6115b89ad90SMark F. Adams level1 = level + 1; 6120cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 6130cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET1],0,0,0,0);CHKERRQ(ierr); 614a2f3521dSMark F. Adams #if (defined GAMG_STAGES) 615a2f3521dSMark F. Adams ierr = PetscLogStagePush(gamg_stages[level]);CHKERRQ(ierr); 616b4fbaa2aSMark F. Adams #endif 617a2f3521dSMark F. Adams #endif 618c8b0795cSMark F. Adams { /* construct prolongator */ 619725b86d8SJed Brown Mat Gmat; 6200cbbd2e1SMark F. Adams PetscCoarsenData *agg_lists; 6217700e67bSMark Adams Mat Prol11; 622c8b0795cSMark F. Adams 6237700e67bSMark Adams ierr = pc_gamg->ops->graph(pc,Aarr[level], &Gmat);CHKERRQ(ierr); 6241ab5ffc9SJed Brown ierr = pc_gamg->ops->coarsen(pc, &Gmat, &agg_lists);CHKERRQ(ierr); 6257700e67bSMark Adams ierr = pc_gamg->ops->prolongator(pc,Aarr[level],Gmat,agg_lists,&Prol11);CHKERRQ(ierr); 626c8b0795cSMark F. Adams 627a2f3521dSMark F. Adams /* could have failed to create new level */ 628a2f3521dSMark F. Adams if (Prol11) { 629f7df55f0SStefano Zampini const char *prefix; 630f7df55f0SStefano Zampini char addp[32]; 631f7df55f0SStefano Zampini 6329d5b6da9SMark F. Adams /* get new block size of coarse matrices */ 6330298fd71SBarry Smith ierr = MatGetBlockSizes(Prol11, NULL, &bs);CHKERRQ(ierr); 634a2f3521dSMark F. Adams 635fd1112cbSBarry Smith if (pc_gamg->ops->optprolongator) { 636c8b0795cSMark F. Adams /* smooth */ 637fd1112cbSBarry Smith ierr = pc_gamg->ops->optprolongator(pc, Aarr[level], &Prol11);CHKERRQ(ierr); 638c8b0795cSMark F. Adams } 639c8b0795cSMark F. Adams 6400c3bc534SBarry Smith if (pc_gamg->use_aggs_in_asm) { 6411b18a24aSMark Adams PetscInt bs; 6421b18a24aSMark Adams ierr = MatGetBlockSizes(Prol11, &bs, NULL);CHKERRQ(ierr); 6430a3c815dSMark Adams ierr = PetscCDGetASMBlocks(agg_lists, bs, Gmat, &nASMBlocksArr[level], &ASMLocalIDsArr[level]);CHKERRQ(ierr); 644ffc955d6SMark F. Adams } 645ffc955d6SMark F. Adams 646f7df55f0SStefano Zampini ierr = PCGetOptionsPrefix(pc,&prefix);CHKERRQ(ierr); 647f7df55f0SStefano Zampini ierr = MatSetOptionsPrefix(Prol11,prefix);CHKERRQ(ierr); 648c9567895SMark ierr = PetscSNPrintf(addp,sizeof(addp),"pc_gamg_prolongator_%d_",(int)level);CHKERRQ(ierr); 649f7df55f0SStefano Zampini ierr = MatAppendOptionsPrefix(Prol11,addp);CHKERRQ(ierr); 65091f31d3dSStefano Zampini /* Always generate the transpose with CUDA 651f7df55f0SStefano Zampini Such behaviour can be adapted with -pc_gamg_prolongator_ prefixed options */ 652f7df55f0SStefano Zampini #if defined(PETSC_HAVE_CUDA) 653f7df55f0SStefano Zampini { 654f7df55f0SStefano Zampini PetscBool ismpiaij; 655f7df55f0SStefano Zampini 656f7df55f0SStefano Zampini ierr = PetscObjectBaseTypeCompare((PetscObject)Prol11,MATMPIAIJ,&ismpiaij);CHKERRQ(ierr); 657f7df55f0SStefano Zampini if (ismpiaij) { 658f7df55f0SStefano Zampini Mat Prol_d,Prol_o; 659f7df55f0SStefano Zampini 660f7df55f0SStefano Zampini ierr = MatMPIAIJGetSeqAIJ(Prol11,&Prol_d,&Prol_o,NULL);CHKERRQ(ierr); 66191f31d3dSStefano Zampini ierr = MatSeqAIJCUSPARSESetGenerateTranspose(Prol_d,PETSC_TRUE);CHKERRQ(ierr); 66291f31d3dSStefano Zampini ierr = MatSeqAIJCUSPARSESetGenerateTranspose(Prol_o,PETSC_TRUE);CHKERRQ(ierr); 663f7df55f0SStefano Zampini } else { 66491f31d3dSStefano Zampini ierr = MatSeqAIJCUSPARSESetGenerateTranspose(Prol11,PETSC_TRUE);CHKERRQ(ierr); 665f7df55f0SStefano Zampini } 666f7df55f0SStefano Zampini } 667f7df55f0SStefano Zampini #endif 668f7df55f0SStefano Zampini ierr = MatSetFromOptions(Prol11);CHKERRQ(ierr); 6694bde40a0SMark Adams Parr[level1] = Prol11; 6704bde40a0SMark Adams } else Parr[level1] = NULL; /* failed to coarsen */ 6714bde40a0SMark Adams 672a2f3521dSMark F. Adams ierr = MatDestroy(&Gmat);CHKERRQ(ierr); 67341b27cdeSMark F. Adams ierr = PetscCDDestroy(agg_lists);CHKERRQ(ierr); 674a2f3521dSMark F. Adams } /* construct prolongator scope */ 6750cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 6760cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET1],0,0,0,0);CHKERRQ(ierr); 677c8b0795cSMark F. Adams #endif 6787f66b68fSMark Adams if (!level) Aarr[0] = Pmat; /* use Pmat for finest level setup */ 679171cca9aSMark Adams if (!Parr[level1]) { /* failed to coarsen */ 680569f4572SMark Adams ierr = PetscInfo1(pc,"Stop gridding, level %D\n",level);CHKERRQ(ierr); 68162294041SBarry Smith #if defined PETSC_GAMG_USE_LOG && defined GAMG_STAGES 682a90e85d9SMark Adams ierr = PetscLogStagePop();CHKERRQ(ierr); 683a90e85d9SMark Adams #endif 684c8b0795cSMark F. Adams break; 685c8b0795cSMark F. Adams } 6860cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 6870cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET2],0,0,0,0);CHKERRQ(ierr); 688b4fbaa2aSMark F. Adams #endif 689171cca9aSMark Adams ierr = MatGetSize(Parr[level1], &M, &N);CHKERRQ(ierr); /* N is next M, a loop test variables */ 690c9567895SMark if (is_last) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Is last ?"); 691171cca9aSMark Adams if (N <= pc_gamg->coarse_eq_limit) is_last = PETSC_TRUE; 6920e2909e1SMark Adams if (level1 == pc_gamg->Nlevels-1) is_last = PETSC_TRUE; 693171cca9aSMark Adams ierr = pc_gamg->ops->createlevel(pc, Aarr[level], bs, &Parr[level1], &Aarr[level1], &nactivepe, NULL, is_last);CHKERRQ(ierr); 694a2f3521dSMark F. Adams 6950cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 6960cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET2],0,0,0,0);CHKERRQ(ierr); 697b4fbaa2aSMark F. Adams #endif 698171cca9aSMark Adams ierr = MatGetSize(Aarr[level1], &M, &N);CHKERRQ(ierr); /* M is loop test variables */ 699569f4572SMark Adams ierr = MatGetInfo(Aarr[level1], MAT_GLOBAL_SUM, &info);CHKERRQ(ierr); 700569f4572SMark Adams nnztot += info.nz_used; 701c9567895SMark ierr = PetscInfo5(pc,"%D) N=%D, n data cols=%D, nnz/row (ave)=%d, %D active pes\n",level1,M,pc_gamg->data_cell_cols,(int)(info.nz_used/(PetscReal)M),nactivepe);CHKERRQ(ierr); 702569f4572SMark Adams 7030cbbd2e1SMark F. Adams #if (defined PETSC_GAMG_USE_LOG && defined GAMG_STAGES) 704b4fbaa2aSMark F. Adams ierr = PetscLogStagePop();CHKERRQ(ierr); 705b4fbaa2aSMark F. Adams #endif 706a90e85d9SMark Adams /* stop if one node or one proc -- could pull back for singular problems */ 7079ab59c8bSMark Adams if ((pc_gamg->data_cell_cols && M/pc_gamg->data_cell_cols < 2) || (!pc_gamg->data_cell_cols && M/bs < 2)) { 7089ab59c8bSMark Adams ierr = PetscInfo2(pc,"HARD stop of coarsening on level %D. Grid too small: %D block nodes\n",level,M/bs);CHKERRQ(ierr); 709a90e85d9SMark Adams level++; 710a90e85d9SMark Adams break; 711a90e85d9SMark Adams } 712c8b0795cSMark F. Adams } /* levels */ 713c8b0795cSMark F. Adams ierr = PetscFree(pc_gamg->data);CHKERRQ(ierr); 714c8b0795cSMark F. Adams 715569f4572SMark Adams ierr = PetscInfo2(pc,"%D levels, grid complexity = %g\n",level+1,nnztot/nnz0);CHKERRQ(ierr); 7169d5b6da9SMark F. Adams pc_gamg->Nlevels = level + 1; 7175b89ad90SMark F. Adams fine_level = level; 7180298fd71SBarry Smith ierr = PCMGSetLevels(pc,pc_gamg->Nlevels,NULL);CHKERRQ(ierr); 7195b89ad90SMark F. Adams 72062294041SBarry Smith if (pc_gamg->Nlevels > 1) { /* don't setup MG if one level */ 7210ed2132dSStefano Zampini PetscErrorCode (*savesetfromoptions[PETSC_MG_MAXLEVELS])(PetscOptionItems*,KSP); 7220ed2132dSStefano Zampini 723d5280255SMark F. Adams /* set default smoothers & set operators */ 72462294041SBarry Smith for (lidx = 1, level = pc_gamg->Nlevels-2; lidx <= fine_level; lidx++, level--) { 725ffc955d6SMark F. Adams KSP smoother; 726ffc955d6SMark F. Adams PC subpc; 727a2f3521dSMark F. Adams 7289d5b6da9SMark F. Adams ierr = PCMGGetSmoother(pc, lidx, &smoother);CHKERRQ(ierr); 729f6536408SMark F. Adams ierr = KSPGetPC(smoother, &subpc);CHKERRQ(ierr); 730ffc955d6SMark F. Adams 731a2f3521dSMark F. Adams ierr = KSPSetNormType(smoother, KSP_NORM_NONE);CHKERRQ(ierr); 732a2f3521dSMark F. Adams /* set ops */ 73323ee1639SBarry Smith ierr = KSPSetOperators(smoother, Aarr[level], Aarr[level]);CHKERRQ(ierr); 734a2f3521dSMark F. Adams ierr = PCMGSetInterpolation(pc, lidx, Parr[level+1]);CHKERRQ(ierr); 735a2f3521dSMark F. Adams 736a2f3521dSMark F. Adams /* set defaults */ 7376c9de887SHong Zhang ierr = KSPSetType(smoother, KSPCHEBYSHEV);CHKERRQ(ierr); 738a2f3521dSMark F. Adams 7390c3bc534SBarry Smith /* set blocks for ASM smoother that uses the 'aggregates' */ 7400c3bc534SBarry Smith if (pc_gamg->use_aggs_in_asm) { 7412d3561bbSSatish Balay PetscInt sz; 7427a28f3e5SMark Adams IS *iss; 743a2f3521dSMark F. Adams 7442d3561bbSSatish Balay sz = nASMBlocksArr[level]; 7457a28f3e5SMark Adams iss = ASMLocalIDsArr[level]; 7460c3bc534SBarry Smith ierr = PCSetType(subpc, PCASM);CHKERRQ(ierr); 7470a3c815dSMark Adams ierr = PCASMSetOverlap(subpc, 0);CHKERRQ(ierr); 7480c3bc534SBarry Smith ierr = PCASMSetType(subpc,PC_ASM_BASIC);CHKERRQ(ierr); 7497f66b68fSMark Adams if (!sz) { 750ffc955d6SMark F. Adams IS is; 7510a3c815dSMark Adams ierr = ISCreateGeneral(PETSC_COMM_SELF, 0, NULL, PETSC_COPY_VALUES, &is);CHKERRQ(ierr); 7527a28f3e5SMark Adams ierr = PCASMSetLocalSubdomains(subpc, 1, NULL, &is);CHKERRQ(ierr); 753a94c3b12SMark F. Adams ierr = ISDestroy(&is);CHKERRQ(ierr); 754806fa848SBarry Smith } else { 755a94c3b12SMark F. Adams PetscInt kk; 7567a28f3e5SMark Adams ierr = PCASMSetLocalSubdomains(subpc, sz, NULL, iss);CHKERRQ(ierr); 757a94c3b12SMark F. Adams for (kk=0; kk<sz; kk++) { 7587a28f3e5SMark Adams ierr = ISDestroy(&iss[kk]);CHKERRQ(ierr); 759a94c3b12SMark F. Adams } 7607a28f3e5SMark Adams ierr = PetscFree(iss);CHKERRQ(ierr); 761ffc955d6SMark F. Adams } 7620298fd71SBarry Smith ASMLocalIDsArr[level] = NULL; 763ffc955d6SMark F. Adams nASMBlocksArr[level] = 0; 764806fa848SBarry Smith } else { 765890ffe84SMark Adams ierr = PCSetType(subpc, PCSOR);CHKERRQ(ierr); 766ffc955d6SMark F. Adams } 767d5280255SMark F. Adams } 768d5280255SMark F. Adams { 769d5280255SMark F. Adams /* coarse grid */ 770d5280255SMark F. Adams KSP smoother,*k2; PC subpc,pc2; PetscInt ii,first; 771d5280255SMark F. Adams Mat Lmat = Aarr[(level=pc_gamg->Nlevels-1)]; lidx = 0; 7720ed2132dSStefano Zampini 773d5280255SMark F. Adams ierr = PCMGGetSmoother(pc, lidx, &smoother);CHKERRQ(ierr); 77423ee1639SBarry Smith ierr = KSPSetOperators(smoother, Lmat, Lmat);CHKERRQ(ierr); 775cf8ae1d3SMark Adams if (!pc_gamg->use_parallel_coarse_grid_solver) { 776d5280255SMark F. Adams ierr = KSPSetNormType(smoother, KSP_NORM_NONE);CHKERRQ(ierr); 777d5280255SMark F. Adams ierr = KSPGetPC(smoother, &subpc);CHKERRQ(ierr); 778d5280255SMark F. Adams ierr = PCSetType(subpc, PCBJACOBI);CHKERRQ(ierr); 779d5280255SMark F. Adams ierr = PCSetUp(subpc);CHKERRQ(ierr); 78071959b99SBarry Smith ierr = PCBJacobiGetSubKSP(subpc,&ii,&first,&k2);CHKERRQ(ierr); 78171959b99SBarry Smith if (ii != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"ii %D is not one",ii); 782d5280255SMark F. Adams ierr = KSPGetPC(k2[0],&pc2);CHKERRQ(ierr); 783d5280255SMark F. Adams ierr = PCSetType(pc2, PCLU);CHKERRQ(ierr); 7849dbfc187SHong Zhang ierr = PCFactorSetShiftType(pc2,MAT_SHIFT_INBLOCKS);CHKERRQ(ierr); 7852fb0b348SMark F. Adams ierr = KSPSetTolerances(k2[0],PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,1);CHKERRQ(ierr); 78608e36f19SMark Adams ierr = KSPSetType(k2[0], KSPPREONLY);CHKERRQ(ierr); 7875b42dca8SJed Brown /* This flag gets reset by PCBJacobiGetSubKSP(), but our BJacobi really does the same algorithm everywhere (and in 7885b42dca8SJed Brown * fact, all but one process will have zero dofs), so we reset the flag to avoid having PCView_BJacobi attempt to 7895b42dca8SJed Brown * view every subdomain as though they were different. */ 7905b42dca8SJed Brown ((PC_BJacobi*)subpc->data)->same_local_solves = PETSC_TRUE; 791d5280255SMark F. Adams } 792cf8ae1d3SMark Adams } 793d5280255SMark F. Adams 794d5280255SMark F. Adams /* should be called in PCSetFromOptions_GAMG(), but cannot be called prior to PCMGSetLevels() */ 795d5280255SMark F. Adams ierr = PetscObjectOptionsBegin((PetscObject)pc);CHKERRQ(ierr); 796e55864a3SBarry Smith ierr = PCSetFromOptions_MG(PetscOptionsObject,pc);CHKERRQ(ierr); 797d5280255SMark F. Adams ierr = PetscOptionsEnd();CHKERRQ(ierr); 79869aca0b8SBarry Smith ierr = PCMGSetGalerkin(pc,PC_MG_GALERKIN_EXTERNAL);CHKERRQ(ierr); 799d5280255SMark F. Adams 80018c3aa7eSMark /* setup cheby eigen estimates from SA */ 8010ed2132dSStefano Zampini if (pc_gamg->use_sa_esteig==1) { 80218c3aa7eSMark for (lidx = 1, level = pc_gamg->Nlevels-2; level >= 0 ; lidx++, level--) { 80318c3aa7eSMark KSP smoother; 80418c3aa7eSMark PetscBool ischeb; 8050ed2132dSStefano Zampini 8060ed2132dSStefano Zampini savesetfromoptions[level] = NULL; 80718c3aa7eSMark ierr = PCMGGetSmoother(pc, lidx, &smoother);CHKERRQ(ierr); 80818c3aa7eSMark ierr = PetscObjectTypeCompare((PetscObject)smoother,KSPCHEBYSHEV,&ischeb);CHKERRQ(ierr); 80918c3aa7eSMark if (ischeb) { 81018c3aa7eSMark KSP_Chebyshev *cheb = (KSP_Chebyshev*)smoother->data; 8110ed2132dSStefano Zampini 8120ed2132dSStefano Zampini ierr = KSPSetFromOptions(smoother);CHKERRQ(ierr); /* let command line emax override using SA's eigenvalues */ 8130ed2132dSStefano Zampini if (mg->max_eigen_DinvA[level] > 0 && cheb->emax == 0.) { 81418c3aa7eSMark PC subpc; 81518c3aa7eSMark PetscBool isjac; 81618c3aa7eSMark ierr = KSPGetPC(smoother, &subpc);CHKERRQ(ierr); 81718c3aa7eSMark ierr = PetscObjectTypeCompare((PetscObject)subpc,PCJACOBI,&isjac);CHKERRQ(ierr); 8180ed2132dSStefano Zampini if (isjac && pc_gamg->use_sa_esteig==1) { 81918c3aa7eSMark PetscReal emax,emin; 8200ed2132dSStefano Zampini 82118c3aa7eSMark emin = mg->min_eigen_DinvA[level]; 82218c3aa7eSMark emax = mg->max_eigen_DinvA[level]; 82318c3aa7eSMark ierr = PetscInfo4(pc,"PCSetUp_GAMG: call KSPChebyshevSetEigenvalues on level %D (N=%D) with emax = %g emin = %g\n",level,Aarr[level]->rmap->N,(double)emax,(double)emin);CHKERRQ(ierr); 82418c3aa7eSMark cheb->emin_computed = emin; 82518c3aa7eSMark cheb->emax_computed = emax; 82618c3aa7eSMark ierr = KSPChebyshevSetEigenvalues(smoother, cheb->tform[2]*emin + cheb->tform[3]*emax, cheb->tform[0]*emin + cheb->tform[1]*emax);CHKERRQ(ierr); 8270ed2132dSStefano Zampini 8280ed2132dSStefano Zampini /* We have set the eigenvalues and consumed the transformation values 8290ed2132dSStefano Zampini prevent from flagging the recomputation of the eigenvalues again in PCSetUp_MG 8300ed2132dSStefano Zampini below when setfromoptions will be called again */ 8310ed2132dSStefano Zampini savesetfromoptions[level] = smoother->ops->setfromoptions; 8320ed2132dSStefano Zampini smoother->ops->setfromoptions = NULL; 83318c3aa7eSMark } 83418c3aa7eSMark } 83518c3aa7eSMark } 83618c3aa7eSMark } 8370ed2132dSStefano Zampini } 8380ed2132dSStefano Zampini 8390ed2132dSStefano Zampini ierr = PCSetUp_MG(pc);CHKERRQ(ierr); 8400ed2132dSStefano Zampini 8410ed2132dSStefano Zampini /* restore Chebyshev smoother for next calls */ 8420ed2132dSStefano Zampini if (pc_gamg->use_sa_esteig==1) { 8430ed2132dSStefano Zampini for (lidx = 1, level = pc_gamg->Nlevels-2; level >= 0 ; lidx++, level--) { 8440ed2132dSStefano Zampini if (savesetfromoptions[level]) { 8450ed2132dSStefano Zampini KSP smoother; 8460ed2132dSStefano Zampini ierr = PCMGGetSmoother(pc, lidx, &smoother);CHKERRQ(ierr); 8470ed2132dSStefano Zampini smoother->ops->setfromoptions = savesetfromoptions[level]; 8480ed2132dSStefano Zampini } 8490ed2132dSStefano Zampini } 8500ed2132dSStefano Zampini } 85118c3aa7eSMark 852d5280255SMark F. Adams /* clean up */ 853d5280255SMark F. Adams for (level=1; level<pc_gamg->Nlevels; level++) { 854587fa25dSMark F. Adams ierr = MatDestroy(&Parr[level]);CHKERRQ(ierr); 855587fa25dSMark F. Adams ierr = MatDestroy(&Aarr[level]);CHKERRQ(ierr); 8565b89ad90SMark F. Adams } 857806fa848SBarry Smith } else { 8585f8cf99dSMark F. Adams KSP smoother; 8590ed2132dSStefano Zampini 860302440fdSBarry Smith ierr = PetscInfo(pc,"One level solver used (system is seen as DD). Using default solver.\n");CHKERRQ(ierr); 8619d5b6da9SMark F. Adams ierr = PCMGGetSmoother(pc, 0, &smoother);CHKERRQ(ierr); 86223ee1639SBarry Smith ierr = KSPSetOperators(smoother, Aarr[0], Aarr[0]);CHKERRQ(ierr); 8635f8cf99dSMark F. Adams ierr = KSPSetType(smoother, KSPPREONLY);CHKERRQ(ierr); 8649d5b6da9SMark F. Adams ierr = PCSetUp_MG(pc);CHKERRQ(ierr); 8655f8cf99dSMark F. Adams } 8665b89ad90SMark F. Adams PetscFunctionReturn(0); 8675b89ad90SMark F. Adams } 8685b89ad90SMark F. Adams 869eb07cef2SMark F. Adams /* ------------------------------------------------------------------------- */ 8705b89ad90SMark F. Adams /* 8715b89ad90SMark F. Adams PCDestroy_GAMG - Destroys the private context for the GAMG preconditioner 8725b89ad90SMark F. Adams that was created with PCCreate_GAMG(). 8735b89ad90SMark F. Adams 8745b89ad90SMark F. Adams Input Parameter: 8755b89ad90SMark F. Adams . pc - the preconditioner context 8765b89ad90SMark F. Adams 8775b89ad90SMark F. Adams Application Interface Routine: PCDestroy() 8785b89ad90SMark F. Adams */ 8795b89ad90SMark F. Adams PetscErrorCode PCDestroy_GAMG(PC pc) 8805b89ad90SMark F. Adams { 8815b89ad90SMark F. Adams PetscErrorCode ierr; 8825b89ad90SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 8835b89ad90SMark F. Adams PC_GAMG *pc_gamg= (PC_GAMG*)mg->innerctx; 8845b89ad90SMark F. Adams 8855b89ad90SMark F. Adams PetscFunctionBegin; 8865b89ad90SMark F. Adams ierr = PCReset_GAMG(pc);CHKERRQ(ierr); 8879b8ffb57SJed Brown if (pc_gamg->ops->destroy) { 8889b8ffb57SJed Brown ierr = (*pc_gamg->ops->destroy)(pc);CHKERRQ(ierr); 8899b8ffb57SJed Brown } 8901ab5ffc9SJed Brown ierr = PetscFree(pc_gamg->ops);CHKERRQ(ierr); 8911ab5ffc9SJed Brown ierr = PetscFree(pc_gamg->gamg_type_name);CHKERRQ(ierr); 8925b89ad90SMark F. Adams ierr = PetscFree(pc_gamg);CHKERRQ(ierr); 8935b89ad90SMark F. Adams ierr = PCDestroy_MG(pc);CHKERRQ(ierr); 8945b89ad90SMark F. Adams PetscFunctionReturn(0); 8955b89ad90SMark F. Adams } 8965b89ad90SMark F. Adams 897676e1743SMark F. Adams /*@ 898cab9ed1eSBarry Smith PCGAMGSetProcEqLim - Set number of equations to aim for per process on the coarse grids via processor reduction. 899676e1743SMark F. Adams 9001cc46a46SBarry Smith Logically Collective on PC 901676e1743SMark F. Adams 902676e1743SMark F. Adams Input Parameters: 9031cc46a46SBarry Smith + pc - the preconditioner context 9041cc46a46SBarry Smith - n - the number of equations 905676e1743SMark F. Adams 906676e1743SMark F. Adams 907676e1743SMark F. Adams Options Database Key: 9081cc46a46SBarry Smith . -pc_gamg_process_eq_limit <limit> 909676e1743SMark F. Adams 91095452b02SPatrick Sanan Notes: 91195452b02SPatrick Sanan GAMG will reduce the number of MPI processes used directly on the coarse grids so that there are around <limit> equations on each process 912cab9ed1eSBarry Smith that has degrees of freedom 913cab9ed1eSBarry Smith 914676e1743SMark F. Adams Level: intermediate 915676e1743SMark F. Adams 916c9567895SMark .seealso: PCGAMGSetCoarseEqLim(), PCGAMGSetRankReductionFactors() 917676e1743SMark F. Adams @*/ 918676e1743SMark F. Adams PetscErrorCode PCGAMGSetProcEqLim(PC pc, PetscInt n) 919676e1743SMark F. Adams { 920676e1743SMark F. Adams PetscErrorCode ierr; 921676e1743SMark F. Adams 922676e1743SMark F. Adams PetscFunctionBegin; 923676e1743SMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 924676e1743SMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetProcEqLim_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr); 925676e1743SMark F. Adams PetscFunctionReturn(0); 926676e1743SMark F. Adams } 927676e1743SMark F. Adams 9281e6b0712SBarry Smith static PetscErrorCode PCGAMGSetProcEqLim_GAMG(PC pc, PetscInt n) 929676e1743SMark F. Adams { 930c20e4228SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 931c20e4228SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 932676e1743SMark F. Adams 933676e1743SMark F. Adams PetscFunctionBegin; 9349d5b6da9SMark F. Adams if (n>0) pc_gamg->min_eq_proc = n; 935676e1743SMark F. Adams PetscFunctionReturn(0); 936676e1743SMark F. Adams } 937676e1743SMark F. Adams 938389730f3SMark F. Adams /*@ 939cab9ed1eSBarry Smith PCGAMGSetCoarseEqLim - Set maximum number of equations on coarsest grid. 940389730f3SMark F. Adams 941389730f3SMark F. Adams Collective on PC 942389730f3SMark F. Adams 943389730f3SMark F. Adams Input Parameters: 9441cc46a46SBarry Smith + pc - the preconditioner context 9451cc46a46SBarry Smith - n - maximum number of equations to aim for 946389730f3SMark F. Adams 947389730f3SMark F. Adams Options Database Key: 9481cc46a46SBarry Smith . -pc_gamg_coarse_eq_limit <limit> 949389730f3SMark F. Adams 95074329af1SBarry Smith Notes: For example -pc_gamg_coarse_eq_limit 1000 will stop coarsening once the coarse grid 95174329af1SBarry Smith has less than 1000 unknowns. 95274329af1SBarry Smith 953389730f3SMark F. Adams Level: intermediate 954389730f3SMark F. Adams 955c9567895SMark .seealso: PCGAMGSetProcEqLim(), PCGAMGSetRankReductionFactors() 956389730f3SMark F. Adams @*/ 957389730f3SMark F. Adams PetscErrorCode PCGAMGSetCoarseEqLim(PC pc, PetscInt n) 958389730f3SMark F. Adams { 959389730f3SMark F. Adams PetscErrorCode ierr; 960389730f3SMark F. Adams 961389730f3SMark F. Adams PetscFunctionBegin; 962389730f3SMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 963389730f3SMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetCoarseEqLim_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr); 964389730f3SMark F. Adams PetscFunctionReturn(0); 965389730f3SMark F. Adams } 966389730f3SMark F. Adams 9671e6b0712SBarry Smith static PetscErrorCode PCGAMGSetCoarseEqLim_GAMG(PC pc, PetscInt n) 968389730f3SMark F. Adams { 969389730f3SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 970389730f3SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 971389730f3SMark F. Adams 972389730f3SMark F. Adams PetscFunctionBegin; 9739d5b6da9SMark F. Adams if (n>0) pc_gamg->coarse_eq_limit = n; 974389730f3SMark F. Adams PetscFunctionReturn(0); 975389730f3SMark F. Adams } 976389730f3SMark F. Adams 977676e1743SMark F. Adams /*@ 978cab9ed1eSBarry Smith PCGAMGSetRepartition - Repartition the degrees of freedom across the processors on the coarser grids 979676e1743SMark F. Adams 980676e1743SMark F. Adams Collective on PC 981676e1743SMark F. Adams 982676e1743SMark F. Adams Input Parameters: 9831cc46a46SBarry Smith + pc - the preconditioner context 9841cc46a46SBarry Smith - n - PETSC_TRUE or PETSC_FALSE 985676e1743SMark F. Adams 986676e1743SMark F. Adams Options Database Key: 9871cc46a46SBarry Smith . -pc_gamg_repartition <true,false> 988676e1743SMark F. Adams 98995452b02SPatrick Sanan Notes: 99095452b02SPatrick Sanan this will generally improve the loading balancing of the work on each level 991cab9ed1eSBarry Smith 992676e1743SMark F. Adams Level: intermediate 993676e1743SMark F. Adams 994676e1743SMark F. Adams .seealso: () 995676e1743SMark F. Adams @*/ 996cab9ed1eSBarry Smith PetscErrorCode PCGAMGSetRepartition(PC pc, PetscBool n) 997676e1743SMark F. Adams { 998676e1743SMark F. Adams PetscErrorCode ierr; 999676e1743SMark F. Adams 1000676e1743SMark F. Adams PetscFunctionBegin; 1001676e1743SMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1002cab9ed1eSBarry Smith ierr = PetscTryMethod(pc,"PCGAMGSetRepartition_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr); 1003676e1743SMark F. Adams PetscFunctionReturn(0); 1004676e1743SMark F. Adams } 1005676e1743SMark F. Adams 1006cab9ed1eSBarry Smith static PetscErrorCode PCGAMGSetRepartition_GAMG(PC pc, PetscBool n) 1007676e1743SMark F. Adams { 1008c20e4228SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1009c20e4228SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1010676e1743SMark F. Adams 1011676e1743SMark F. Adams PetscFunctionBegin; 10129d5b6da9SMark F. Adams pc_gamg->repart = n; 1013676e1743SMark F. Adams PetscFunctionReturn(0); 1014676e1743SMark F. Adams } 1015676e1743SMark F. Adams 1016dfd5c07aSMark F. Adams /*@ 101718c3aa7eSMark PCGAMGSetEstEigKSPMaxIt - Set number of KSP iterations in eigen estimator (for Cheby) 101818c3aa7eSMark 101918c3aa7eSMark Collective on PC 102018c3aa7eSMark 102118c3aa7eSMark Input Parameters: 102218c3aa7eSMark + pc - the preconditioner context 102318c3aa7eSMark - n - number of its 102418c3aa7eSMark 102518c3aa7eSMark Options Database Key: 102618c3aa7eSMark . -pc_gamg_esteig_ksp_max_it <its> 102718c3aa7eSMark 102818c3aa7eSMark Notes: 102918c3aa7eSMark 103018c3aa7eSMark Level: intermediate 103118c3aa7eSMark 103218c3aa7eSMark .seealso: () 103318c3aa7eSMark @*/ 103418c3aa7eSMark PetscErrorCode PCGAMGSetEstEigKSPMaxIt(PC pc, PetscInt n) 103518c3aa7eSMark { 103618c3aa7eSMark PetscErrorCode ierr; 103718c3aa7eSMark 103818c3aa7eSMark PetscFunctionBegin; 103918c3aa7eSMark PetscValidHeaderSpecific(pc,PC_CLASSID,1); 104018c3aa7eSMark ierr = PetscTryMethod(pc,"PCGAMGSetEstEigKSPMaxIt_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr); 104118c3aa7eSMark PetscFunctionReturn(0); 104218c3aa7eSMark } 104318c3aa7eSMark 104418c3aa7eSMark static PetscErrorCode PCGAMGSetEstEigKSPMaxIt_GAMG(PC pc, PetscInt n) 104518c3aa7eSMark { 104618c3aa7eSMark PC_MG *mg = (PC_MG*)pc->data; 104718c3aa7eSMark PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 104818c3aa7eSMark 104918c3aa7eSMark PetscFunctionBegin; 105018c3aa7eSMark pc_gamg->esteig_max_it = n; 105118c3aa7eSMark PetscFunctionReturn(0); 105218c3aa7eSMark } 105318c3aa7eSMark 105418c3aa7eSMark /*@ 105518c3aa7eSMark PCGAMGSetUseSAEstEig - Use eigen estimate from smoothed aggregation for Cheby smoother 105618c3aa7eSMark 105718c3aa7eSMark Collective on PC 105818c3aa7eSMark 105918c3aa7eSMark Input Parameters: 106018c3aa7eSMark + pc - the preconditioner context 106118c3aa7eSMark - n - number of its 106218c3aa7eSMark 106318c3aa7eSMark Options Database Key: 106418c3aa7eSMark . -pc_gamg_use_sa_esteig <true,false> 106518c3aa7eSMark 106618c3aa7eSMark Notes: 106718c3aa7eSMark 106818c3aa7eSMark Level: intermediate 106918c3aa7eSMark 107018c3aa7eSMark .seealso: () 107118c3aa7eSMark @*/ 107218c3aa7eSMark PetscErrorCode PCGAMGSetUseSAEstEig(PC pc, PetscBool n) 107318c3aa7eSMark { 107418c3aa7eSMark PetscErrorCode ierr; 107518c3aa7eSMark 107618c3aa7eSMark PetscFunctionBegin; 107718c3aa7eSMark PetscValidHeaderSpecific(pc,PC_CLASSID,1); 107818c3aa7eSMark ierr = PetscTryMethod(pc,"PCGAMGSetUseSAEstEig_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr); 107918c3aa7eSMark PetscFunctionReturn(0); 108018c3aa7eSMark } 108118c3aa7eSMark 10820ed2132dSStefano Zampini static PetscErrorCode PCGAMGSetUseSAEstEig_GAMG(PC pc, PetscBool n) 108318c3aa7eSMark { 108418c3aa7eSMark PC_MG *mg = (PC_MG*)pc->data; 108518c3aa7eSMark PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 108618c3aa7eSMark 108718c3aa7eSMark PetscFunctionBegin; 108818c3aa7eSMark pc_gamg->use_sa_esteig = n ? 1 : 0; 108918c3aa7eSMark PetscFunctionReturn(0); 109018c3aa7eSMark } 109118c3aa7eSMark 109218c3aa7eSMark /*@C 109318c3aa7eSMark PCGAMGSetEstEigKSPType - Set type of KSP in eigen estimator (for Cheby) 109418c3aa7eSMark 109518c3aa7eSMark Collective on PC 109618c3aa7eSMark 109718c3aa7eSMark Input Parameters: 109818c3aa7eSMark + pc - the preconditioner context 109918c3aa7eSMark - t - ksp type 110018c3aa7eSMark 110118c3aa7eSMark Options Database Key: 110218c3aa7eSMark . -pc_gamg_esteig_ksp_type <type> 110318c3aa7eSMark 110418c3aa7eSMark Notes: 110518c3aa7eSMark 110618c3aa7eSMark Level: intermediate 110718c3aa7eSMark 110818c3aa7eSMark .seealso: () 110918c3aa7eSMark @*/ 111018c3aa7eSMark PetscErrorCode PCGAMGSetEstEigKSPType(PC pc, char t[]) 111118c3aa7eSMark { 111218c3aa7eSMark PetscErrorCode ierr; 111318c3aa7eSMark 111418c3aa7eSMark PetscFunctionBegin; 111518c3aa7eSMark PetscValidHeaderSpecific(pc,PC_CLASSID,1); 111618c3aa7eSMark ierr = PetscTryMethod(pc,"PCGAMGSetEstEigKSPType_C",(PC,char[]),(pc,t));CHKERRQ(ierr); 111718c3aa7eSMark PetscFunctionReturn(0); 111818c3aa7eSMark } 111918c3aa7eSMark 112018c3aa7eSMark static PetscErrorCode PCGAMGSetEstEigKSPType_GAMG(PC pc, char t[]) 112118c3aa7eSMark { 112218c3aa7eSMark PetscErrorCode ierr; 112318c3aa7eSMark PC_MG *mg = (PC_MG*)pc->data; 112418c3aa7eSMark PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 112518c3aa7eSMark 112618c3aa7eSMark PetscFunctionBegin; 112718c3aa7eSMark ierr = PetscStrcpy(pc_gamg->esteig_type,t);CHKERRQ(ierr); 112818c3aa7eSMark PetscFunctionReturn(0); 112918c3aa7eSMark } 113018c3aa7eSMark 113118c3aa7eSMark /*@ 113218c3aa7eSMark PCGAMGSetEigenvalues - Set eigenvalues 113318c3aa7eSMark 113418c3aa7eSMark Collective on PC 113518c3aa7eSMark 113618c3aa7eSMark Input Parameters: 113718c3aa7eSMark + pc - the preconditioner context 113818c3aa7eSMark - emax - max eigenvalue 113918c3aa7eSMark . emin - min eigenvalue 114018c3aa7eSMark 114118c3aa7eSMark Options Database Key: 114218c3aa7eSMark . -pc_gamg_eigenvalues 114318c3aa7eSMark 114418c3aa7eSMark Level: intermediate 114518c3aa7eSMark 114618c3aa7eSMark .seealso: PCGAMGSetEstEigKSPMaxIt(), PCGAMGSetUseSAEstEig(), PCGAMGSetEstEigKSPType() 114718c3aa7eSMark @*/ 114818c3aa7eSMark PetscErrorCode PCGAMGSetEigenvalues(PC pc, PetscReal emax,PetscReal emin) 114918c3aa7eSMark { 115018c3aa7eSMark PetscErrorCode ierr; 115118c3aa7eSMark 115218c3aa7eSMark PetscFunctionBegin; 115318c3aa7eSMark PetscValidHeaderSpecific(pc,PC_CLASSID,1); 115418c3aa7eSMark ierr = PetscTryMethod(pc,"PCGAMGSetEigenvalues_C",(PC,PetscReal,PetscReal),(pc,emax,emin));CHKERRQ(ierr); 115518c3aa7eSMark PetscFunctionReturn(0); 115618c3aa7eSMark } 115718c3aa7eSMark static PetscErrorCode PCGAMGSetEigenvalues_GAMG(PC pc,PetscReal emax,PetscReal emin) 115818c3aa7eSMark { 115918c3aa7eSMark PC_MG *mg = (PC_MG*)pc->data; 116018c3aa7eSMark PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 116118c3aa7eSMark 116218c3aa7eSMark PetscFunctionBegin; 116318c3aa7eSMark if (emax <= emin) SETERRQ2(PetscObjectComm((PetscObject)pc),PETSC_ERR_ARG_INCOMP,"Maximum eigenvalue must be larger than minimum: max %g min %g",(double)emax,(double)emin); 116418c3aa7eSMark if (emax*emin <= 0.0) SETERRQ2(PetscObjectComm((PetscObject)pc),PETSC_ERR_ARG_INCOMP,"Both eigenvalues must be of the same sign: max %g min %g",(double)emax,(double)emin); 116518c3aa7eSMark pc_gamg->emax = emax; 116618c3aa7eSMark pc_gamg->emin = emin; 116718c3aa7eSMark 116818c3aa7eSMark PetscFunctionReturn(0); 116918c3aa7eSMark } 117018c3aa7eSMark 117118c3aa7eSMark /*@ 1172cab9ed1eSBarry Smith PCGAMGSetReuseInterpolation - Reuse prolongation when rebuilding algebraic multigrid preconditioner 1173dfd5c07aSMark F. Adams 1174dfd5c07aSMark F. Adams Collective on PC 1175dfd5c07aSMark F. Adams 1176dfd5c07aSMark F. Adams Input Parameters: 11771cc46a46SBarry Smith + pc - the preconditioner context 11781cc46a46SBarry Smith - n - PETSC_TRUE or PETSC_FALSE 1179dfd5c07aSMark F. Adams 1180dfd5c07aSMark F. Adams Options Database Key: 11811cc46a46SBarry Smith . -pc_gamg_reuse_interpolation <true,false> 1182dfd5c07aSMark F. Adams 1183dfd5c07aSMark F. Adams Level: intermediate 1184dfd5c07aSMark F. Adams 118595452b02SPatrick Sanan Notes: 118695452b02SPatrick Sanan this may negatively affect the convergence rate of the method on new matrices if the matrix entries change a great deal, but allows 1187cab9ed1eSBarry Smith rebuilding the preconditioner quicker. 1188cab9ed1eSBarry Smith 1189dfd5c07aSMark F. Adams .seealso: () 1190dfd5c07aSMark F. Adams @*/ 11911cc46a46SBarry Smith PetscErrorCode PCGAMGSetReuseInterpolation(PC pc, PetscBool n) 1192dfd5c07aSMark F. Adams { 1193dfd5c07aSMark F. Adams PetscErrorCode ierr; 1194dfd5c07aSMark F. Adams 1195dfd5c07aSMark F. Adams PetscFunctionBegin; 1196dfd5c07aSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 11971cc46a46SBarry Smith ierr = PetscTryMethod(pc,"PCGAMGSetReuseInterpolation_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr); 1198dfd5c07aSMark F. Adams PetscFunctionReturn(0); 1199dfd5c07aSMark F. Adams } 1200dfd5c07aSMark F. Adams 12011cc46a46SBarry Smith static PetscErrorCode PCGAMGSetReuseInterpolation_GAMG(PC pc, PetscBool n) 1202dfd5c07aSMark F. Adams { 1203dfd5c07aSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1204dfd5c07aSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1205dfd5c07aSMark F. Adams 1206dfd5c07aSMark F. Adams PetscFunctionBegin; 1207dfd5c07aSMark F. Adams pc_gamg->reuse_prol = n; 1208dfd5c07aSMark F. Adams PetscFunctionReturn(0); 1209dfd5c07aSMark F. Adams } 1210dfd5c07aSMark F. Adams 1211ffc955d6SMark F. Adams /*@ 1212cab9ed1eSBarry Smith PCGAMGASMSetUseAggs - Have the PCGAMG smoother on each level use the aggregates defined by the coarsening process as the subdomains for the additive Schwarz preconditioner. 1213ffc955d6SMark F. Adams 1214ffc955d6SMark F. Adams Collective on PC 1215ffc955d6SMark F. Adams 1216ffc955d6SMark F. Adams Input Parameters: 1217cab9ed1eSBarry Smith + pc - the preconditioner context 1218cab9ed1eSBarry Smith - flg - PETSC_TRUE to use aggregates, PETSC_FALSE to not 1219ffc955d6SMark F. Adams 1220ffc955d6SMark F. Adams Options Database Key: 1221cab9ed1eSBarry Smith . -pc_gamg_asm_use_agg 1222ffc955d6SMark F. Adams 1223ffc955d6SMark F. Adams Level: intermediate 1224ffc955d6SMark F. Adams 1225ffc955d6SMark F. Adams .seealso: () 1226ffc955d6SMark F. Adams @*/ 1227cab9ed1eSBarry Smith PetscErrorCode PCGAMGASMSetUseAggs(PC pc, PetscBool flg) 1228ffc955d6SMark F. Adams { 1229ffc955d6SMark F. Adams PetscErrorCode ierr; 1230ffc955d6SMark F. Adams 1231ffc955d6SMark F. Adams PetscFunctionBegin; 1232ffc955d6SMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1233cab9ed1eSBarry Smith ierr = PetscTryMethod(pc,"PCGAMGASMSetUseAggs_C",(PC,PetscBool),(pc,flg));CHKERRQ(ierr); 1234ffc955d6SMark F. Adams PetscFunctionReturn(0); 1235ffc955d6SMark F. Adams } 1236ffc955d6SMark F. Adams 1237cab9ed1eSBarry Smith static PetscErrorCode PCGAMGASMSetUseAggs_GAMG(PC pc, PetscBool flg) 1238ffc955d6SMark F. Adams { 1239ffc955d6SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1240ffc955d6SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1241ffc955d6SMark F. Adams 1242ffc955d6SMark F. Adams PetscFunctionBegin; 1243cab9ed1eSBarry Smith pc_gamg->use_aggs_in_asm = flg; 1244ffc955d6SMark F. Adams PetscFunctionReturn(0); 1245ffc955d6SMark F. Adams } 1246ffc955d6SMark F. Adams 1247171cca9aSMark Adams /*@ 1248cf8ae1d3SMark Adams PCGAMGSetUseParallelCoarseGridSolve - allow a parallel coarse grid solver 1249171cca9aSMark Adams 1250171cca9aSMark Adams Collective on PC 1251171cca9aSMark Adams 1252171cca9aSMark Adams Input Parameters: 1253171cca9aSMark Adams + pc - the preconditioner context 1254cf8ae1d3SMark Adams - flg - PETSC_TRUE to not force coarse grid onto one processor 1255171cca9aSMark Adams 1256171cca9aSMark Adams Options Database Key: 1257cf8ae1d3SMark Adams . -pc_gamg_use_parallel_coarse_grid_solver 1258171cca9aSMark Adams 1259171cca9aSMark Adams Level: intermediate 1260171cca9aSMark Adams 126139d09545SMark Adams .seealso: PCGAMGSetCoarseGridLayoutType(), PCGAMGSetCpuPinCoarseGrids() 1262171cca9aSMark Adams @*/ 1263171cca9aSMark Adams PetscErrorCode PCGAMGSetUseParallelCoarseGridSolve(PC pc, PetscBool flg) 1264171cca9aSMark Adams { 1265171cca9aSMark Adams PetscErrorCode ierr; 1266171cca9aSMark Adams 1267171cca9aSMark Adams PetscFunctionBegin; 1268171cca9aSMark Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1269171cca9aSMark Adams ierr = PetscTryMethod(pc,"PCGAMGSetUseParallelCoarseGridSolve_C",(PC,PetscBool),(pc,flg));CHKERRQ(ierr); 1270171cca9aSMark Adams PetscFunctionReturn(0); 1271171cca9aSMark Adams } 1272171cca9aSMark Adams 1273171cca9aSMark Adams static PetscErrorCode PCGAMGSetUseParallelCoarseGridSolve_GAMG(PC pc, PetscBool flg) 1274171cca9aSMark Adams { 1275171cca9aSMark Adams PC_MG *mg = (PC_MG*)pc->data; 1276171cca9aSMark Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1277171cca9aSMark Adams 1278171cca9aSMark Adams PetscFunctionBegin; 1279171cca9aSMark Adams pc_gamg->use_parallel_coarse_grid_solver = flg; 1280ffc955d6SMark F. Adams PetscFunctionReturn(0); 1281ffc955d6SMark F. Adams } 1282ffc955d6SMark F. Adams 12834ef23d27SMark F. Adams /*@ 1284ce7c7f2fSMark Adams PCGAMGSetCpuPinCoarseGrids - pin reduced grids to CPU 1285ce7c7f2fSMark Adams 1286ce7c7f2fSMark Adams Collective on PC 1287ce7c7f2fSMark Adams 1288ce7c7f2fSMark Adams Input Parameters: 1289ce7c7f2fSMark Adams + pc - the preconditioner context 1290ce7c7f2fSMark Adams - flg - PETSC_TRUE to pin coarse grids to CPU 1291ce7c7f2fSMark Adams 1292ce7c7f2fSMark Adams Options Database Key: 1293ce7c7f2fSMark Adams . -pc_gamg_cpu_pin_coarse_grids 1294ce7c7f2fSMark Adams 1295ce7c7f2fSMark Adams Level: intermediate 1296ce7c7f2fSMark Adams 129739d09545SMark Adams .seealso: PCGAMGSetCoarseGridLayoutType(), PCGAMGSetUseParallelCoarseGridSolve() 1298ce7c7f2fSMark Adams @*/ 1299ce7c7f2fSMark Adams PetscErrorCode PCGAMGSetCpuPinCoarseGrids(PC pc, PetscBool flg) 1300ce7c7f2fSMark Adams { 1301ce7c7f2fSMark Adams PetscErrorCode ierr; 1302ce7c7f2fSMark Adams 1303ce7c7f2fSMark Adams PetscFunctionBegin; 1304ce7c7f2fSMark Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1305ce7c7f2fSMark Adams ierr = PetscTryMethod(pc,"PCGAMGSetCpuPinCoarseGrids_C",(PC,PetscBool),(pc,flg));CHKERRQ(ierr); 1306ce7c7f2fSMark Adams PetscFunctionReturn(0); 1307ce7c7f2fSMark Adams } 1308ce7c7f2fSMark Adams 1309ce7c7f2fSMark Adams static PetscErrorCode PCGAMGSetCpuPinCoarseGrids_GAMG(PC pc, PetscBool flg) 1310ce7c7f2fSMark Adams { 1311ce7c7f2fSMark Adams PC_MG *mg = (PC_MG*)pc->data; 1312ce7c7f2fSMark Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1313ce7c7f2fSMark Adams 1314ce7c7f2fSMark Adams PetscFunctionBegin; 1315ce7c7f2fSMark Adams pc_gamg->cpu_pin_coarse_grids = flg; 1316ce7c7f2fSMark Adams PetscFunctionReturn(0); 1317ce7c7f2fSMark Adams } 1318ce7c7f2fSMark Adams 1319ce7c7f2fSMark Adams /*@ 1320ce7c7f2fSMark Adams PCGAMGSetCoarseGridLayoutType - place reduce grids on processors with natural order (compact type) 1321ce7c7f2fSMark Adams 1322ce7c7f2fSMark Adams Collective on PC 1323ce7c7f2fSMark Adams 1324ce7c7f2fSMark Adams Input Parameters: 1325ce7c7f2fSMark Adams + pc - the preconditioner context 1326ce7c7f2fSMark Adams - flg - Layout type 1327ce7c7f2fSMark Adams 1328ce7c7f2fSMark Adams Options Database Key: 1329ce7c7f2fSMark Adams . -pc_gamg_coarse_grid_layout_type 1330ce7c7f2fSMark Adams 1331ce7c7f2fSMark Adams Level: intermediate 1332ce7c7f2fSMark Adams 133339d09545SMark Adams .seealso: PCGAMGSetUseParallelCoarseGridSolve(), PCGAMGSetCpuPinCoarseGrids() 1334ce7c7f2fSMark Adams @*/ 1335ce7c7f2fSMark Adams PetscErrorCode PCGAMGSetCoarseGridLayoutType(PC pc, PCGAMGLayoutType flg) 1336ce7c7f2fSMark Adams { 1337ce7c7f2fSMark Adams PetscErrorCode ierr; 1338ce7c7f2fSMark Adams 1339ce7c7f2fSMark Adams PetscFunctionBegin; 1340ce7c7f2fSMark Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1341ce7c7f2fSMark Adams ierr = PetscTryMethod(pc,"PCGAMGSetCoarseGridLayoutType_C",(PC,PCGAMGLayoutType),(pc,flg));CHKERRQ(ierr); 1342ce7c7f2fSMark Adams PetscFunctionReturn(0); 1343ce7c7f2fSMark Adams } 1344ce7c7f2fSMark Adams 1345ce7c7f2fSMark Adams static PetscErrorCode PCGAMGSetCoarseGridLayoutType_GAMG(PC pc, PCGAMGLayoutType flg) 1346ce7c7f2fSMark Adams { 1347ce7c7f2fSMark Adams PC_MG *mg = (PC_MG*)pc->data; 1348ce7c7f2fSMark Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1349ce7c7f2fSMark Adams 1350ce7c7f2fSMark Adams PetscFunctionBegin; 1351ce7c7f2fSMark Adams pc_gamg->layout_type = flg; 1352ce7c7f2fSMark Adams PetscFunctionReturn(0); 1353ce7c7f2fSMark Adams } 1354ce7c7f2fSMark Adams 1355ce7c7f2fSMark Adams /*@ 13561cc46a46SBarry Smith PCGAMGSetNlevels - Sets the maximum number of levels PCGAMG will use 13574ef23d27SMark F. Adams 13584ef23d27SMark F. Adams Not collective on PC 13594ef23d27SMark F. Adams 13604ef23d27SMark F. Adams Input Parameters: 13611cc46a46SBarry Smith + pc - the preconditioner 13621cc46a46SBarry Smith - n - the maximum number of levels to use 13634ef23d27SMark F. Adams 13644ef23d27SMark F. Adams Options Database Key: 13654ef23d27SMark F. Adams . -pc_mg_levels 13664ef23d27SMark F. Adams 13674ef23d27SMark F. Adams Level: intermediate 13684ef23d27SMark F. Adams 13694ef23d27SMark F. Adams .seealso: () 13704ef23d27SMark F. Adams @*/ 13714ef23d27SMark F. Adams PetscErrorCode PCGAMGSetNlevels(PC pc, PetscInt n) 13724ef23d27SMark F. Adams { 13734ef23d27SMark F. Adams PetscErrorCode ierr; 13744ef23d27SMark F. Adams 13754ef23d27SMark F. Adams PetscFunctionBegin; 13764ef23d27SMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 13774ef23d27SMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetNlevels_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr); 13784ef23d27SMark F. Adams PetscFunctionReturn(0); 13794ef23d27SMark F. Adams } 13804ef23d27SMark F. Adams 13811e6b0712SBarry Smith static PetscErrorCode PCGAMGSetNlevels_GAMG(PC pc, PetscInt n) 13824ef23d27SMark F. Adams { 13834ef23d27SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 13844ef23d27SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 13854ef23d27SMark F. Adams 13864ef23d27SMark F. Adams PetscFunctionBegin; 13879d5b6da9SMark F. Adams pc_gamg->Nlevels = n; 13884ef23d27SMark F. Adams PetscFunctionReturn(0); 13894ef23d27SMark F. Adams } 13904ef23d27SMark F. Adams 13913542efc5SMark F. Adams /*@ 13923542efc5SMark F. Adams PCGAMGSetThreshold - Relative threshold to use for dropping edges in aggregation graph 13933542efc5SMark F. Adams 13943542efc5SMark F. Adams Not collective on PC 13953542efc5SMark F. Adams 13963542efc5SMark F. Adams Input Parameters: 13971cc46a46SBarry Smith + pc - the preconditioner context 1398c9567895SMark . v - array of threshold values for finest n levels; 0.0 means keep all nonzero entries in the graph; negative means keep even zero entries in the graph 1399055c8bd0SJed Brown - n - number of threshold values provided in array 14003542efc5SMark F. Adams 14013542efc5SMark F. Adams Options Database Key: 14021cc46a46SBarry Smith . -pc_gamg_threshold <threshold> 14033542efc5SMark F. Adams 140495452b02SPatrick Sanan Notes: 1405af3c827dSMark Adams Increasing the threshold decreases the rate of coarsening. Conversely reducing the threshold increases the rate of coarsening (aggressive coarsening) and thereby reduces the complexity of the coarse grids, and generally results in slower solver converge rates. Reducing coarse grid complexity reduced the complexity of Galerkin coarse grid construction considerably. 1406af3c827dSMark Adams Before coarsening or aggregating the graph, GAMG removes small values from the graph with this threshold, and thus reducing the coupling in the graph and a different (perhaps better) coarser set of points. 1407cab9ed1eSBarry Smith 1408055c8bd0SJed Brown If n is less than the total number of coarsenings (see PCGAMGSetNlevels()), then threshold scaling (see PCGAMGSetThresholdScale()) is used for each successive coarsening. 1409055c8bd0SJed Brown In this case, PCGAMGSetThresholdScale() must be called before PCGAMGSetThreshold(). 1410055c8bd0SJed Brown If n is greater than the total number of levels, the excess entries in threshold will not be used. 1411055c8bd0SJed Brown 14123542efc5SMark F. Adams Level: intermediate 14133542efc5SMark F. Adams 1414af3c827dSMark Adams .seealso: PCGAMGFilterGraph(), PCGAMGSetSquareGraph() 14153542efc5SMark F. Adams @*/ 1416c1eae691SMark Adams PetscErrorCode PCGAMGSetThreshold(PC pc, PetscReal v[], PetscInt n) 14173542efc5SMark F. Adams { 14183542efc5SMark F. Adams PetscErrorCode ierr; 14193542efc5SMark F. Adams 14203542efc5SMark F. Adams PetscFunctionBegin; 14213542efc5SMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1422055c8bd0SJed Brown if (n) PetscValidRealPointer(v,2); 1423c1eae691SMark Adams ierr = PetscTryMethod(pc,"PCGAMGSetThreshold_C",(PC,PetscReal[],PetscInt),(pc,v,n));CHKERRQ(ierr); 14243542efc5SMark F. Adams PetscFunctionReturn(0); 14253542efc5SMark F. Adams } 14263542efc5SMark F. Adams 1427c1eae691SMark Adams static PetscErrorCode PCGAMGSetThreshold_GAMG(PC pc, PetscReal v[], PetscInt n) 14283542efc5SMark F. Adams { 1429c20e4228SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1430c20e4228SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1431c1eae691SMark Adams PetscInt i; 1432c1eae691SMark Adams PetscFunctionBegin; 1433055c8bd0SJed Brown for (i=0; i<PetscMin(n,PETSC_MG_MAXLEVELS); i++) pc_gamg->threshold[i] = v[i]; 1434055c8bd0SJed Brown for (; i<PETSC_MG_MAXLEVELS; i++) pc_gamg->threshold[i] = pc_gamg->threshold[i-1]*pc_gamg->threshold_scale; 1435c1eae691SMark Adams PetscFunctionReturn(0); 1436c1eae691SMark Adams } 1437c1eae691SMark Adams 1438c1eae691SMark Adams /*@ 1439c9567895SMark PCGAMGSetRankReductionFactors - Set manual schedual for process reduction on coarse grids 1440c9567895SMark 1441c9567895SMark Collective on PC 1442c9567895SMark 1443c9567895SMark Input Parameters: 1444c9567895SMark + pc - the preconditioner context 1445c9567895SMark . v - array of reduction factors. 0 for fist value forces a reduction to one process/device on first level in Cuda 1446c9567895SMark - n - number of values provided in array 1447c9567895SMark 1448c9567895SMark Options Database Key: 1449c9567895SMark . -pc_gamg_rank_reduction_factors <factors> 1450c9567895SMark 1451c9567895SMark Level: intermediate 1452c9567895SMark 1453c9567895SMark .seealso: PCGAMGSetProcEqLim(), PCGAMGSetCoarseEqLim() 1454c9567895SMark @*/ 1455c9567895SMark PetscErrorCode PCGAMGSetRankReductionFactors(PC pc, PetscInt v[], PetscInt n) 1456c9567895SMark { 1457c9567895SMark PetscErrorCode ierr; 1458c9567895SMark 1459c9567895SMark PetscFunctionBegin; 1460c9567895SMark PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1461c9567895SMark if (n) PetscValidIntPointer(v,2); 1462c9567895SMark ierr = PetscTryMethod(pc,"PCGAMGSetRankReductionFactors_C",(PC,PetscInt[],PetscInt),(pc,v,n));CHKERRQ(ierr); 1463c9567895SMark PetscFunctionReturn(0); 1464c9567895SMark } 1465c9567895SMark 1466c9567895SMark static PetscErrorCode PCGAMGSetRankReductionFactors_GAMG(PC pc, PetscInt v[], PetscInt n) 1467c9567895SMark { 1468c9567895SMark PC_MG *mg = (PC_MG*)pc->data; 1469c9567895SMark PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1470c9567895SMark PetscInt i; 1471c9567895SMark PetscFunctionBegin; 1472c9567895SMark for (i=0; i<PetscMin(n,PETSC_MG_MAXLEVELS); i++) pc_gamg->level_reduction_factors[i] = v[i]; 1473c9567895SMark for (; i<PETSC_MG_MAXLEVELS; i++) pc_gamg->level_reduction_factors[i] = -1; /* 0 stop putting one process/device on first level */ 1474c9567895SMark PetscFunctionReturn(0); 1475c9567895SMark } 1476c9567895SMark 1477c9567895SMark /*@ 1478c1eae691SMark Adams PCGAMGSetThresholdScale - Relative threshold reduction at each level 1479c1eae691SMark Adams 1480c1eae691SMark Adams Not collective on PC 1481c1eae691SMark Adams 1482c1eae691SMark Adams Input Parameters: 1483c1eae691SMark Adams + pc - the preconditioner context 1484c1eae691SMark Adams - scale - the threshold value reduction, ussually < 1.0 1485c1eae691SMark Adams 1486c1eae691SMark Adams Options Database Key: 1487c1eae691SMark Adams . -pc_gamg_threshold_scale <v> 1488c1eae691SMark Adams 1489055c8bd0SJed Brown Notes: 1490055c8bd0SJed Brown The initial threshold (for an arbitrary number of levels starting from the finest) can be set with PCGAMGSetThreshold(). 1491055c8bd0SJed Brown This scaling is used for each subsequent coarsening, but must be called before PCGAMGSetThreshold(). 1492055c8bd0SJed Brown 1493c1eae691SMark Adams Level: advanced 1494c1eae691SMark Adams 1495055c8bd0SJed Brown .seealso: PCGAMGSetThreshold() 1496c1eae691SMark Adams @*/ 1497c1eae691SMark Adams PetscErrorCode PCGAMGSetThresholdScale(PC pc, PetscReal v) 1498c1eae691SMark Adams { 1499c1eae691SMark Adams PetscErrorCode ierr; 15003542efc5SMark F. Adams 15013542efc5SMark F. Adams PetscFunctionBegin; 1502c1eae691SMark Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1503c1eae691SMark Adams ierr = PetscTryMethod(pc,"PCGAMGSetThresholdScale_C",(PC,PetscReal),(pc,v));CHKERRQ(ierr); 1504c1eae691SMark Adams PetscFunctionReturn(0); 1505c1eae691SMark Adams } 1506c1eae691SMark Adams 1507c1eae691SMark Adams static PetscErrorCode PCGAMGSetThresholdScale_GAMG(PC pc, PetscReal v) 1508c1eae691SMark Adams { 1509c1eae691SMark Adams PC_MG *mg = (PC_MG*)pc->data; 1510c1eae691SMark Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1511c1eae691SMark Adams PetscFunctionBegin; 1512c1eae691SMark Adams pc_gamg->threshold_scale = v; 15133542efc5SMark F. Adams PetscFunctionReturn(0); 15143542efc5SMark F. Adams } 15153542efc5SMark F. Adams 1516e20c40e8SBarry Smith /*@C 1517c60c7ad4SBarry Smith PCGAMGSetType - Set solution method 1518676e1743SMark F. Adams 1519676e1743SMark F. Adams Collective on PC 1520676e1743SMark F. Adams 1521676e1743SMark F. Adams Input Parameters: 1522c60c7ad4SBarry Smith + pc - the preconditioner context 1523c60c7ad4SBarry Smith - type - PCGAMGAGG, PCGAMGGEO, or PCGAMGCLASSICAL 1524676e1743SMark F. Adams 1525676e1743SMark F. Adams Options Database Key: 1526cab9ed1eSBarry Smith . -pc_gamg_type <agg,geo,classical> - type of algebraic multigrid to apply 1527676e1743SMark F. Adams 1528676e1743SMark F. Adams Level: intermediate 1529676e1743SMark F. Adams 1530cab9ed1eSBarry Smith .seealso: PCGAMGGetType(), PCGAMG, PCGAMGType 1531676e1743SMark F. Adams @*/ 153219fd82e9SBarry Smith PetscErrorCode PCGAMGSetType(PC pc, PCGAMGType type) 1533676e1743SMark F. Adams { 1534676e1743SMark F. Adams PetscErrorCode ierr; 1535676e1743SMark F. Adams 1536676e1743SMark F. Adams PetscFunctionBegin; 1537676e1743SMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1538806fa848SBarry Smith ierr = PetscTryMethod(pc,"PCGAMGSetType_C",(PC,PCGAMGType),(pc,type));CHKERRQ(ierr); 1539676e1743SMark F. Adams PetscFunctionReturn(0); 1540676e1743SMark F. Adams } 1541676e1743SMark F. Adams 1542e20c40e8SBarry Smith /*@C 1543c60c7ad4SBarry Smith PCGAMGGetType - Get solution method 1544c60c7ad4SBarry Smith 1545c60c7ad4SBarry Smith Collective on PC 1546c60c7ad4SBarry Smith 1547c60c7ad4SBarry Smith Input Parameter: 1548c60c7ad4SBarry Smith . pc - the preconditioner context 1549c60c7ad4SBarry Smith 1550c60c7ad4SBarry Smith Output Parameter: 1551c60c7ad4SBarry Smith . type - the type of algorithm used 1552c60c7ad4SBarry Smith 1553c60c7ad4SBarry Smith Level: intermediate 1554c60c7ad4SBarry Smith 15551c1aac46SBarry Smith .seealso: PCGAMGSetType(), PCGAMGType 1556c60c7ad4SBarry Smith @*/ 1557c60c7ad4SBarry Smith PetscErrorCode PCGAMGGetType(PC pc, PCGAMGType *type) 1558c60c7ad4SBarry Smith { 1559c60c7ad4SBarry Smith PetscErrorCode ierr; 1560c60c7ad4SBarry Smith 1561c60c7ad4SBarry Smith PetscFunctionBegin; 1562c60c7ad4SBarry Smith PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1563c60c7ad4SBarry Smith ierr = PetscUseMethod(pc,"PCGAMGGetType_C",(PC,PCGAMGType*),(pc,type));CHKERRQ(ierr); 1564c60c7ad4SBarry Smith PetscFunctionReturn(0); 1565c60c7ad4SBarry Smith } 1566c60c7ad4SBarry Smith 1567c60c7ad4SBarry Smith static PetscErrorCode PCGAMGGetType_GAMG(PC pc, PCGAMGType *type) 1568c60c7ad4SBarry Smith { 1569c60c7ad4SBarry Smith PC_MG *mg = (PC_MG*)pc->data; 1570c60c7ad4SBarry Smith PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1571c60c7ad4SBarry Smith 1572c60c7ad4SBarry Smith PetscFunctionBegin; 1573c60c7ad4SBarry Smith *type = pc_gamg->type; 1574c60c7ad4SBarry Smith PetscFunctionReturn(0); 1575c60c7ad4SBarry Smith } 1576c60c7ad4SBarry Smith 15771e6b0712SBarry Smith static PetscErrorCode PCGAMGSetType_GAMG(PC pc, PCGAMGType type) 1578676e1743SMark F. Adams { 15799d5b6da9SMark F. Adams PetscErrorCode ierr,(*r)(PC); 15801ab5ffc9SJed Brown PC_MG *mg = (PC_MG*)pc->data; 15811ab5ffc9SJed Brown PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1582676e1743SMark F. Adams 1583676e1743SMark F. Adams PetscFunctionBegin; 1584c60c7ad4SBarry Smith pc_gamg->type = type; 15851c9cd337SJed Brown ierr = PetscFunctionListFind(GAMGList,type,&r);CHKERRQ(ierr); 15869d5b6da9SMark F. Adams if (!r) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown GAMG type %s given",type); 15871ab5ffc9SJed Brown if (pc_gamg->ops->destroy) { 15881ab5ffc9SJed Brown ierr = (*pc_gamg->ops->destroy)(pc);CHKERRQ(ierr); 15891ab5ffc9SJed Brown ierr = PetscMemzero(pc_gamg->ops,sizeof(struct _PCGAMGOps));CHKERRQ(ierr); 1590e616c208SToby Isaac pc_gamg->ops->createlevel = PCGAMGCreateLevel_GAMG; 15913ae0bb68SMark Adams /* cleaning up common data in pc_gamg - this should disapear someday */ 15923ae0bb68SMark Adams pc_gamg->data_cell_cols = 0; 15933ae0bb68SMark Adams pc_gamg->data_cell_rows = 0; 15943ae0bb68SMark Adams pc_gamg->orig_data_cell_cols = 0; 15953ae0bb68SMark Adams pc_gamg->orig_data_cell_rows = 0; 15963ae0bb68SMark Adams ierr = PetscFree(pc_gamg->data);CHKERRQ(ierr); 15973ae0bb68SMark Adams pc_gamg->data_sz = 0; 15981ab5ffc9SJed Brown } 15991ab5ffc9SJed Brown ierr = PetscFree(pc_gamg->gamg_type_name);CHKERRQ(ierr); 16001ab5ffc9SJed Brown ierr = PetscStrallocpy(type,&pc_gamg->gamg_type_name);CHKERRQ(ierr); 16019d5b6da9SMark F. Adams ierr = (*r)(pc);CHKERRQ(ierr); 1602676e1743SMark F. Adams PetscFunctionReturn(0); 1603676e1743SMark F. Adams } 1604676e1743SMark F. Adams 16059d766c59SMark Adams /* -------------------------------------------------------------------------- */ 16069d766c59SMark Adams /* 16079d766c59SMark Adams PCMGGetGridComplexity - compute coarse grid complexity of MG hierarchy 16089d766c59SMark Adams 16099d766c59SMark Adams Input Parameter: 16109d766c59SMark Adams . pc - the preconditioner context 16119d766c59SMark Adams 16129d766c59SMark Adams Output Parameter: 16139d766c59SMark Adams . gc - grid complexity = sum_i(nnz_i) / nnz_0 16149d766c59SMark Adams 16159d766c59SMark Adams Level: advanced 16169d766c59SMark Adams */ 16179d766c59SMark Adams static PetscErrorCode PCMGGetGridComplexity(PC pc, PetscReal *gc) 16189d766c59SMark Adams { 16199d766c59SMark Adams PetscErrorCode ierr; 16209d766c59SMark Adams PC_MG *mg = (PC_MG*)pc->data; 16219d766c59SMark Adams PC_MG_Levels **mglevels = mg->levels; 16223966268fSBarry Smith PetscInt lev; 16233966268fSBarry Smith PetscLogDouble nnz0 = 0, sgc = 0; 16249d766c59SMark Adams MatInfo info; 16253966268fSBarry Smith 16269d766c59SMark Adams PetscFunctionBegin; 1627dbf6bb8dSprj- if (!pc->setupcalled) { 1628dbf6bb8dSprj- *gc = 0; 1629dbf6bb8dSprj- PetscFunctionReturn(0); 1630dbf6bb8dSprj- } 16319d766c59SMark Adams if (!mg->nlevels) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"MG has no levels"); 16323966268fSBarry Smith for (lev=0; lev<mg->nlevels; lev++) { 163362a6e064SMark Adams Mat dB; 163462a6e064SMark Adams ierr = KSPGetOperators(mglevels[lev]->smoothd,NULL,&dB);CHKERRQ(ierr); 163562a6e064SMark Adams ierr = MatGetInfo(dB,MAT_GLOBAL_SUM,&info);CHKERRQ(ierr); /* global reduction */ 16363966268fSBarry Smith sgc += info.nz_used; 16379d766c59SMark Adams if (lev==mg->nlevels-1) nnz0 = info.nz_used; 16389d766c59SMark Adams } 16393966268fSBarry Smith if (nnz0 > 0) *gc = (PetscReal)(sgc/nnz0); 16403966268fSBarry Smith else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Number for grid points on finest level is not available"); 16419d766c59SMark Adams PetscFunctionReturn(0); 16429d766c59SMark Adams } 16439d766c59SMark Adams 16445adeb434SBarry Smith static PetscErrorCode PCView_GAMG(PC pc,PetscViewer viewer) 16455adeb434SBarry Smith { 1646c1eae691SMark Adams PetscErrorCode ierr,i; 16475adeb434SBarry Smith PC_MG *mg = (PC_MG*)pc->data; 16485adeb434SBarry Smith PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 164923b2d91dSMark Adams PetscReal gc=0; 16505adeb434SBarry Smith PetscFunctionBegin; 16515adeb434SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," GAMG specific options\n");CHKERRQ(ierr); 1652459726d8SSatish Balay ierr = PetscViewerASCIIPrintf(viewer," Threshold for dropping small values in graph on each level =");CHKERRQ(ierr); 1653b3e187dcSStefano Zampini for (i=0;i<mg->nlevels; i++) { 1654c1eae691SMark Adams ierr = PetscViewerASCIIPrintf(viewer," %g",(double)pc_gamg->threshold[i]);CHKERRQ(ierr); 1655c1eae691SMark Adams } 1656459726d8SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 1657459726d8SSatish Balay ierr = PetscViewerASCIIPrintf(viewer," Threshold scaling factor for each level not specified = %g\n",(double)pc_gamg->threshold_scale);CHKERRQ(ierr); 1658cab9ed1eSBarry Smith if (pc_gamg->use_aggs_in_asm) { 1659cab9ed1eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," Using aggregates from coarsening process to define subdomains for PCASM\n");CHKERRQ(ierr); 1660cab9ed1eSBarry Smith } 1661171cca9aSMark Adams if (pc_gamg->use_parallel_coarse_grid_solver) { 1662171cca9aSMark Adams ierr = PetscViewerASCIIPrintf(viewer," Using parallel coarse grid solver (all coarse grid equations not put on one process)\n");CHKERRQ(ierr); 1663171cca9aSMark Adams } 1664ce7c7f2fSMark Adams #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 1665ce7c7f2fSMark Adams if (pc_gamg->cpu_pin_coarse_grids) { 1666ce7c7f2fSMark Adams /* ierr = PetscViewerASCIIPrintf(viewer," Pinning coarse grids to the CPU)\n");CHKERRQ(ierr); */ 1667ce7c7f2fSMark Adams } 1668ce7c7f2fSMark Adams #endif 1669ce7c7f2fSMark Adams /* if (pc_gamg->layout_type==PCGAMG_LAYOUT_COMPACT) { */ 1670ce7c7f2fSMark Adams /* ierr = PetscViewerASCIIPrintf(viewer," Put reduced grids on processes in natural order (ie, 0,1,2...)\n");CHKERRQ(ierr); */ 1671ce7c7f2fSMark Adams /* } else { */ 1672ce7c7f2fSMark Adams /* ierr = PetscViewerASCIIPrintf(viewer," Put reduced grids on whole machine (ie, 0,1*f,2*f...,np-f)\n");CHKERRQ(ierr); */ 1673ce7c7f2fSMark Adams /* } */ 16745adeb434SBarry Smith if (pc_gamg->ops->view) { 16755adeb434SBarry Smith ierr = (*pc_gamg->ops->view)(pc,viewer);CHKERRQ(ierr); 16765adeb434SBarry Smith } 16779d766c59SMark Adams ierr = PCMGGetGridComplexity(pc,&gc);CHKERRQ(ierr); 16789d766c59SMark Adams ierr = PetscViewerASCIIPrintf(viewer," Complexity: grid = %g\n",gc);CHKERRQ(ierr); 16795adeb434SBarry Smith PetscFunctionReturn(0); 16805adeb434SBarry Smith } 16815adeb434SBarry Smith 16824416b707SBarry Smith PetscErrorCode PCSetFromOptions_GAMG(PetscOptionItems *PetscOptionsObject,PC pc) 16835b89ad90SMark F. Adams { 1684676e1743SMark F. Adams PetscErrorCode ierr; 1685676e1743SMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1686676e1743SMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 168718c3aa7eSMark PetscBool flag,f2; 16883b4367a7SBarry Smith MPI_Comm comm; 168918c3aa7eSMark char prefix[256],tname[32]; 1690c1eae691SMark Adams PetscInt i,n; 169114a9496bSBarry Smith const char *pcpre; 16920a545947SLisandro Dalcin static const char *LayoutTypes[] = {"compact","spread","PCGAMGLayoutType","PC_GAMG_LAYOUT",NULL}; 16935b89ad90SMark F. Adams PetscFunctionBegin; 16943b4367a7SBarry Smith ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 1695e55864a3SBarry Smith ierr = PetscOptionsHead(PetscOptionsObject,"GAMG options");CHKERRQ(ierr); 16961a1c1e04SBarry Smith ierr = PetscOptionsFList("-pc_gamg_type","Type of AMG method","PCGAMGSetType",GAMGList, pc_gamg->gamg_type_name, tname, sizeof(tname), &flag);CHKERRQ(ierr); 1697bd94a7aaSJed Brown if (flag) { 1698bd94a7aaSJed Brown ierr = PCGAMGSetType(pc,tname);CHKERRQ(ierr); 16991ab5ffc9SJed Brown } 170018c3aa7eSMark ierr = PetscOptionsFList("-pc_gamg_esteig_ksp_type","Krylov method for eigen estimator","PCGAMGSetEstEigKSPType",KSPList,pc_gamg->esteig_type,tname,sizeof(tname),&flag);CHKERRQ(ierr); 170118c3aa7eSMark if (flag) { 170218c3aa7eSMark ierr = PCGAMGSetEstEigKSPType(pc,tname);CHKERRQ(ierr); 170318c3aa7eSMark } 1704cab9ed1eSBarry Smith ierr = PetscOptionsBool("-pc_gamg_repartition","Repartion coarse grids","PCGAMGSetRepartition",pc_gamg->repart,&pc_gamg->repart,NULL);CHKERRQ(ierr); 170518c3aa7eSMark f2 = PETSC_TRUE; 170618c3aa7eSMark ierr = PetscOptionsBool("-pc_gamg_use_sa_esteig","Use eigen estimate from Smoothed aggregation for smoother","PCGAMGSetUseSAEstEig",f2,&f2,&flag);CHKERRQ(ierr); 170718c3aa7eSMark if (flag) pc_gamg->use_sa_esteig = f2 ? 1 : 0; 17081cc46a46SBarry Smith ierr = PetscOptionsBool("-pc_gamg_reuse_interpolation","Reuse prolongation operator","PCGAMGReuseInterpolation",pc_gamg->reuse_prol,&pc_gamg->reuse_prol,NULL);CHKERRQ(ierr); 1709a303c832SJed Brown ierr = PetscOptionsBool("-pc_gamg_asm_use_agg","Use aggregation aggregates for ASM smoother","PCGAMGASMSetUseAggs",pc_gamg->use_aggs_in_asm,&pc_gamg->use_aggs_in_asm,NULL);CHKERRQ(ierr); 1710cf8ae1d3SMark Adams ierr = PetscOptionsBool("-pc_gamg_use_parallel_coarse_grid_solver","Use parallel coarse grid solver (otherwise put last grid on one process)","PCGAMGSetUseParallelCoarseGridSolve",pc_gamg->use_parallel_coarse_grid_solver,&pc_gamg->use_parallel_coarse_grid_solver,NULL);CHKERRQ(ierr); 1711ce7c7f2fSMark Adams ierr = PetscOptionsBool("-pc_gamg_cpu_pin_coarse_grids","Pin coarse grids to the CPU","PCGAMGSetCpuPinCoarseGrids",pc_gamg->cpu_pin_coarse_grids,&pc_gamg->cpu_pin_coarse_grids,NULL);CHKERRQ(ierr); 1712a0095786SMark ierr = PetscOptionsEnum("-pc_gamg_coarse_grid_layout_type","compact: place reduced grids on processes in natural order; spread: distribute to whole machine for more memory bandwidth","PCGAMGSetCoarseGridLayoutType",LayoutTypes,(PetscEnum)pc_gamg->layout_type,(PetscEnum*)&pc_gamg->layout_type,NULL);CHKERRQ(ierr); 171394ae4db5SBarry Smith ierr = PetscOptionsInt("-pc_gamg_process_eq_limit","Limit (goal) on number of equations per process on coarse grids","PCGAMGSetProcEqLim",pc_gamg->min_eq_proc,&pc_gamg->min_eq_proc,NULL);CHKERRQ(ierr); 171418c3aa7eSMark ierr = PetscOptionsInt("-pc_gamg_esteig_ksp_max_it","Number of iterations of eigen estimator","PCGAMGSetEstEigKSPMaxIt",pc_gamg->esteig_max_it,&pc_gamg->esteig_max_it,NULL);CHKERRQ(ierr); 171594ae4db5SBarry Smith ierr = PetscOptionsInt("-pc_gamg_coarse_eq_limit","Limit on number of equations for the coarse grid","PCGAMGSetCoarseEqLim",pc_gamg->coarse_eq_limit,&pc_gamg->coarse_eq_limit,NULL);CHKERRQ(ierr); 1716a303c832SJed Brown ierr = PetscOptionsReal("-pc_gamg_threshold_scale","Scaling of threshold for each level not specified","PCGAMGSetThresholdScale",pc_gamg->threshold_scale,&pc_gamg->threshold_scale,NULL);CHKERRQ(ierr); 171718c3aa7eSMark n = PETSC_MG_MAXLEVELS; 1718c1eae691SMark Adams ierr = PetscOptionsRealArray("-pc_gamg_threshold","Relative threshold to use for dropping edges in aggregation graph","PCGAMGSetThreshold",pc_gamg->threshold,&n,&flag);CHKERRQ(ierr); 171918c3aa7eSMark if (!flag || n < PETSC_MG_MAXLEVELS) { 1720efd3c5ceSMark Adams if (!flag) n = 1; 1721c1eae691SMark Adams i = n; 172218c3aa7eSMark do {pc_gamg->threshold[i] = pc_gamg->threshold[i-1]*pc_gamg->threshold_scale;} while (++i<PETSC_MG_MAXLEVELS); 1723c1eae691SMark Adams } 1724c9567895SMark n = PETSC_MG_MAXLEVELS; 1725c9567895SMark ierr = PetscOptionsIntArray("-pc_gamg_rank_reduction_factors","Manual schedule of coarse grid reduction factors that overrides internal heuristics (0 for first reduction puts one process/device)","PCGAMGSetRankReductionFactors",pc_gamg->level_reduction_factors,&n,&flag);CHKERRQ(ierr); 1726c9567895SMark if (!flag) i = 0; 1727c9567895SMark else i = n; 1728c9567895SMark do {pc_gamg->level_reduction_factors[i] = -1;} while (++i<PETSC_MG_MAXLEVELS); 172994ae4db5SBarry Smith ierr = PetscOptionsInt("-pc_mg_levels","Set number of MG levels","PCGAMGSetNlevels",pc_gamg->Nlevels,&pc_gamg->Nlevels,NULL);CHKERRQ(ierr); 173018c3aa7eSMark { 173118c3aa7eSMark PetscReal eminmax[2] = {0., 0.}; 173218c3aa7eSMark n = 2; 173318c3aa7eSMark ierr = PetscOptionsRealArray("-pc_gamg_eigenvalues","extreme eigenvalues for smoothed aggregation","PCGAMGSetEigenvalues",eminmax,&n,&flag);CHKERRQ(ierr); 173418c3aa7eSMark if (flag) { 173518c3aa7eSMark if (n != 2) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_ARG_INCOMP,"-pc_gamg_eigenvalues: must specify 2 parameters, min and max eigenvalues"); 173618c3aa7eSMark ierr = PCGAMGSetEigenvalues(pc, eminmax[1], eminmax[0]);CHKERRQ(ierr); 173718c3aa7eSMark } 173818c3aa7eSMark } 1739b7cbab4eSMark Adams /* set options for subtype */ 1740e55864a3SBarry Smith if (pc_gamg->ops->setfromoptions) {ierr = (*pc_gamg->ops->setfromoptions)(PetscOptionsObject,pc);CHKERRQ(ierr);} 174118c3aa7eSMark 174214a9496bSBarry Smith ierr = PCGetOptionsPrefix(pc, &pcpre);CHKERRQ(ierr); 174314a9496bSBarry Smith ierr = PetscSNPrintf(prefix,sizeof(prefix),"%spc_gamg_",pcpre ? pcpre : "");CHKERRQ(ierr); 1744676e1743SMark F. Adams ierr = PetscOptionsTail();CHKERRQ(ierr); 17455b89ad90SMark F. Adams PetscFunctionReturn(0); 17465b89ad90SMark F. Adams } 17475b89ad90SMark F. Adams 17485b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */ 17495b89ad90SMark F. Adams /*MC 17501cc46a46SBarry Smith PCGAMG - Geometric algebraic multigrid (AMG) preconditioner 17515b89ad90SMark F. Adams 1752280d9858SJed Brown Options Database Keys: 1753cab9ed1eSBarry Smith + -pc_gamg_type <type> - one of agg, geo, or classical 1754cab9ed1eSBarry Smith . -pc_gamg_repartition <true,default=false> - repartition the degrees of freedom accross the coarse grids as they are determined 1755cab9ed1eSBarry Smith . -pc_gamg_reuse_interpolation <true,default=false> - when rebuilding the algebraic multigrid preconditioner reuse the previously computed interpolations 1756cab9ed1eSBarry Smith . -pc_gamg_asm_use_agg <true,default=false> - use the aggregates from the coasening process to defined the subdomains on each level for the PCASM smoother 1757cab9ed1eSBarry Smith . -pc_gamg_process_eq_limit <limit, default=50> - GAMG will reduce the number of MPI processes used directly on the coarse grids so that there are around <limit> 1758cab9ed1eSBarry Smith equations on each process that has degrees of freedom 1759cab9ed1eSBarry Smith . -pc_gamg_coarse_eq_limit <limit, default=50> - Set maximum number of equations on coarsest grid to aim for. 17606008e27bSRichard Tran Mills . -pc_gamg_threshold[] <thresh,default=0> - Before aggregating the graph GAMG will remove small values from the graph on each level 1761c1eae691SMark Adams - -pc_gamg_threshold_scale <scale,default=1> - Scaling of threshold on each coarser grid if not specified 1762cab9ed1eSBarry Smith 1763cab9ed1eSBarry Smith Options Database Keys for default Aggregation: 1764cab9ed1eSBarry Smith + -pc_gamg_agg_nsmooths <nsmooth, default=1> - number of smoothing steps to use with smooth aggregation 1765cab9ed1eSBarry Smith . -pc_gamg_sym_graph <true,default=false> - symmetrize the graph before computing the aggregation 1766cab9ed1eSBarry Smith - -pc_gamg_square_graph <n,default=1> - number of levels to square the graph before aggregating it 1767cab9ed1eSBarry Smith 1768db9745e2SBarry Smith Multigrid options: 1769db9745e2SBarry Smith + -pc_mg_cycles <v> - v or w, see PCMGSetCycleType() 1770db9745e2SBarry Smith . -pc_mg_distinct_smoothup - configure the up and down (pre and post) smoothers separately, see PCMGSetDistinctSmoothUp() 1771db9745e2SBarry Smith . -pc_mg_type <multiplicative> - (one of) additive multiplicative full kascade 1772cab9ed1eSBarry Smith - -pc_mg_levels <levels> - Number of levels of multigrid to use. 17735b89ad90SMark F. Adams 17741cc46a46SBarry Smith 177595452b02SPatrick Sanan Notes: 177695452b02SPatrick Sanan In order to obtain good performance for PCGAMG for vector valued problems you must 1777db9745e2SBarry Smith Call MatSetBlockSize() to indicate the number of degrees of freedom per grid point 1778db9745e2SBarry Smith Call MatSetNearNullSpace() (or PCSetCoordinates() if solving the equations of elasticity) to indicate the near null space of the operator 1779db9745e2SBarry Smith See the Users Manual Chapter 4 for more details 17801cc46a46SBarry Smith 17815b89ad90SMark F. Adams Level: intermediate 1782280d9858SJed Brown 17831cc46a46SBarry Smith .seealso: PCCreate(), PCSetType(), MatSetBlockSize(), PCMGType, PCSetCoordinates(), MatSetNearNullSpace(), PCGAMGSetType(), PCGAMGAGG, PCGAMGGEO, PCGAMGCLASSICAL, PCGAMGSetProcEqLim(), 178418c3aa7eSMark PCGAMGSetCoarseEqLim(), PCGAMGSetRepartition(), PCGAMGRegister(), PCGAMGSetReuseInterpolation(), PCGAMGASMSetUseAggs(), PCGAMGSetUseParallelCoarseGridSolve(), PCGAMGSetNlevels(), PCGAMGSetThreshold(), PCGAMGGetType(), PCGAMGSetReuseInterpolation(), PCGAMGSetUseSAEstEig(), PCGAMGSetEstEigKSPMaxIt(), PCGAMGSetEstEigKSPType() 17855b89ad90SMark F. Adams M*/ 1786b2573a8aSBarry Smith 17878cc058d9SJed Brown PETSC_EXTERN PetscErrorCode PCCreate_GAMG(PC pc) 17885b89ad90SMark F. Adams { 1789c1eae691SMark Adams PetscErrorCode ierr,i; 17905b89ad90SMark F. Adams PC_GAMG *pc_gamg; 17915b89ad90SMark F. Adams PC_MG *mg; 17925b89ad90SMark F. Adams 17935b89ad90SMark F. Adams PetscFunctionBegin; 17941c1aac46SBarry Smith /* register AMG type */ 17951c1aac46SBarry Smith ierr = PCGAMGInitializePackage();CHKERRQ(ierr); 17961c1aac46SBarry Smith 17975b89ad90SMark F. Adams /* PCGAMG is an inherited class of PCMG. Initialize pc as PCMG */ 17981c1aac46SBarry Smith ierr = PCSetType(pc, PCMG);CHKERRQ(ierr); 17995b89ad90SMark F. Adams ierr = PetscObjectChangeTypeName((PetscObject)pc, PCGAMG);CHKERRQ(ierr); 18005b89ad90SMark F. Adams 18015b89ad90SMark F. Adams /* create a supporting struct and attach it to pc */ 1802b00a9115SJed Brown ierr = PetscNewLog(pc,&pc_gamg);CHKERRQ(ierr); 180369aca0b8SBarry Smith ierr = PCMGSetGalerkin(pc,PC_MG_GALERKIN_EXTERNAL);CHKERRQ(ierr); 18045b89ad90SMark F. Adams mg = (PC_MG*)pc->data; 18055b89ad90SMark F. Adams mg->innerctx = pc_gamg; 18065b89ad90SMark F. Adams 1807b00a9115SJed Brown ierr = PetscNewLog(pc,&pc_gamg->ops);CHKERRQ(ierr); 18081ab5ffc9SJed Brown 18099d5b6da9SMark F. Adams /* these should be in subctx but repartitioning needs simple arrays */ 18109d5b6da9SMark F. Adams pc_gamg->data_sz = 0; 18110a545947SLisandro Dalcin pc_gamg->data = NULL; 18125b89ad90SMark F. Adams 18139d5b6da9SMark F. Adams /* overwrite the pointers of PCMG by the functions of base class PCGAMG */ 18145b89ad90SMark F. Adams pc->ops->setfromoptions = PCSetFromOptions_GAMG; 18155b89ad90SMark F. Adams pc->ops->setup = PCSetUp_GAMG; 18165b89ad90SMark F. Adams pc->ops->reset = PCReset_GAMG; 18175b89ad90SMark F. Adams pc->ops->destroy = PCDestroy_GAMG; 18185adeb434SBarry Smith mg->view = PCView_GAMG; 18195b89ad90SMark F. Adams 182097d33e41SMatthew G. Knepley ierr = PetscObjectComposeFunction((PetscObject)pc,"PCMGGetLevels_C",PCMGGetLevels_MG);CHKERRQ(ierr); 182197d33e41SMatthew G. Knepley ierr = PetscObjectComposeFunction((PetscObject)pc,"PCMGSetLevels_C",PCMGSetLevels_MG);CHKERRQ(ierr); 1822bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetProcEqLim_C",PCGAMGSetProcEqLim_GAMG);CHKERRQ(ierr); 1823bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetCoarseEqLim_C",PCGAMGSetCoarseEqLim_GAMG);CHKERRQ(ierr); 1824cab9ed1eSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetRepartition_C",PCGAMGSetRepartition_GAMG);CHKERRQ(ierr); 182518c3aa7eSMark ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetEstEigKSPType_C",PCGAMGSetEstEigKSPType_GAMG);CHKERRQ(ierr); 182618c3aa7eSMark ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetEstEigKSPMaxIt_C",PCGAMGSetEstEigKSPMaxIt_GAMG);CHKERRQ(ierr); 182718c3aa7eSMark ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetEigenvalues_C",PCGAMGSetEigenvalues_GAMG);CHKERRQ(ierr); 182818c3aa7eSMark ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetUseSAEstEig_C",PCGAMGSetUseSAEstEig_GAMG);CHKERRQ(ierr); 18291cc46a46SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetReuseInterpolation_C",PCGAMGSetReuseInterpolation_GAMG);CHKERRQ(ierr); 1830cab9ed1eSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGASMSetUseAggs_C",PCGAMGASMSetUseAggs_GAMG);CHKERRQ(ierr); 1831171cca9aSMark Adams ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetUseParallelCoarseGridSolve_C",PCGAMGSetUseParallelCoarseGridSolve_GAMG);CHKERRQ(ierr); 1832ce7c7f2fSMark Adams ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetCpuPinCoarseGrids_C",PCGAMGSetCpuPinCoarseGrids_GAMG);CHKERRQ(ierr); 1833ce7c7f2fSMark Adams ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetCoarseGridLayoutType_C",PCGAMGSetCoarseGridLayoutType_GAMG);CHKERRQ(ierr); 1834bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetThreshold_C",PCGAMGSetThreshold_GAMG);CHKERRQ(ierr); 1835c9567895SMark ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetRankReductionFactors_C",PCGAMGSetRankReductionFactors_GAMG);CHKERRQ(ierr); 1836c1eae691SMark Adams ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetThresholdScale_C",PCGAMGSetThresholdScale_GAMG);CHKERRQ(ierr); 1837bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetType_C",PCGAMGSetType_GAMG);CHKERRQ(ierr); 1838c60c7ad4SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGGetType_C",PCGAMGGetType_GAMG);CHKERRQ(ierr); 1839bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCGAMGSetNlevels_C",PCGAMGSetNlevels_GAMG);CHKERRQ(ierr); 18409d5b6da9SMark F. Adams pc_gamg->repart = PETSC_FALSE; 1841d3042614SMark Adams pc_gamg->reuse_prol = PETSC_FALSE; 18420c3bc534SBarry Smith pc_gamg->use_aggs_in_asm = PETSC_FALSE; 1843171cca9aSMark Adams pc_gamg->use_parallel_coarse_grid_solver = PETSC_FALSE; 1844a0095786SMark pc_gamg->cpu_pin_coarse_grids = PETSC_FALSE; 1845a0095786SMark pc_gamg->layout_type = PCGAMG_LAYOUT_SPREAD; 1846038f3aa4SMark F. Adams pc_gamg->min_eq_proc = 50; 184725a145a7SMark Adams pc_gamg->coarse_eq_limit = 50; 184818c3aa7eSMark for (i=0;i<PETSC_MG_MAXLEVELS;i++) pc_gamg->threshold[i] = 0.; 1849c1eae691SMark Adams pc_gamg->threshold_scale = 1.; 185018c3aa7eSMark pc_gamg->Nlevels = PETSC_MG_MAXLEVELS; 18519ab59c8bSMark Adams pc_gamg->current_level = 0; /* don't need to init really */ 1852d24ecf33SMark ierr = PetscStrcpy(pc_gamg->esteig_type,NULL);CHKERRQ(ierr); 185318c3aa7eSMark pc_gamg->esteig_max_it = 10; 185418c3aa7eSMark pc_gamg->use_sa_esteig = -1; 185518c3aa7eSMark pc_gamg->emin = 0; 185618c3aa7eSMark pc_gamg->emax = 0; 185718c3aa7eSMark 1858c238b0ebSToby Isaac pc_gamg->ops->createlevel = PCGAMGCreateLevel_GAMG; 18599d5b6da9SMark F. Adams 1860bd94a7aaSJed Brown /* PCSetUp_GAMG assumes that the type has been set, so set it to the default now */ 1861bd94a7aaSJed Brown ierr = PCGAMGSetType(pc,PCGAMGAGG);CHKERRQ(ierr); 18625b89ad90SMark F. Adams PetscFunctionReturn(0); 18635b89ad90SMark F. Adams } 18643e3471ccSMark Adams 18653e3471ccSMark Adams /*@C 18663e3471ccSMark Adams PCGAMGInitializePackage - This function initializes everything in the PCGAMG package. It is called 18678a690491SBarry Smith from PCInitializePackage(). 18683e3471ccSMark Adams 18693e3471ccSMark Adams Level: developer 18703e3471ccSMark Adams 18713e3471ccSMark Adams .seealso: PetscInitialize() 18723e3471ccSMark Adams @*/ 18733e3471ccSMark Adams PetscErrorCode PCGAMGInitializePackage(void) 18743e3471ccSMark Adams { 18753e3471ccSMark Adams PetscErrorCode ierr; 18763e3471ccSMark Adams 18773e3471ccSMark Adams PetscFunctionBegin; 18783e3471ccSMark Adams if (PCGAMGPackageInitialized) PetscFunctionReturn(0); 18793e3471ccSMark Adams PCGAMGPackageInitialized = PETSC_TRUE; 18803e3471ccSMark Adams ierr = PetscFunctionListAdd(&GAMGList,PCGAMGGEO,PCCreateGAMG_GEO);CHKERRQ(ierr); 18813e3471ccSMark Adams ierr = PetscFunctionListAdd(&GAMGList,PCGAMGAGG,PCCreateGAMG_AGG);CHKERRQ(ierr); 18828e6d0c30SPeter Brune ierr = PetscFunctionListAdd(&GAMGList,PCGAMGCLASSICAL,PCCreateGAMG_Classical);CHKERRQ(ierr); 18833e3471ccSMark Adams ierr = PetscRegisterFinalize(PCGAMGFinalizePackage);CHKERRQ(ierr); 1884c1c463dbSMark Adams 1885c1c463dbSMark Adams /* general events */ 1886fd1112cbSBarry Smith ierr = PetscLogEventRegister("PCGAMGGraph_AGG", 0, &PC_GAMGGraph_AGG);CHKERRQ(ierr); 1887fd1112cbSBarry Smith ierr = PetscLogEventRegister("PCGAMGGraph_GEO", PC_CLASSID, &PC_GAMGGraph_GEO);CHKERRQ(ierr); 1888fd1112cbSBarry Smith ierr = PetscLogEventRegister("PCGAMGCoarse_AGG", PC_CLASSID, &PC_GAMGCoarsen_AGG);CHKERRQ(ierr); 1889fd1112cbSBarry Smith ierr = PetscLogEventRegister("PCGAMGCoarse_GEO", PC_CLASSID, &PC_GAMGCoarsen_GEO);CHKERRQ(ierr); 1890c1c463dbSMark Adams ierr = PetscLogEventRegister("PCGAMGProl_AGG", PC_CLASSID, &PC_GAMGProlongator_AGG);CHKERRQ(ierr); 1891c1c463dbSMark Adams ierr = PetscLogEventRegister("PCGAMGProl_GEO", PC_CLASSID, &PC_GAMGProlongator_GEO);CHKERRQ(ierr); 1892fd1112cbSBarry Smith ierr = PetscLogEventRegister("PCGAMGPOpt_AGG", PC_CLASSID, &PC_GAMGOptProlongator_AGG);CHKERRQ(ierr); 1893c1c463dbSMark Adams 18945b89ad90SMark F. Adams #if defined PETSC_GAMG_USE_LOG 18955b89ad90SMark F. Adams ierr = PetscLogEventRegister("GAMG: createProl", PC_CLASSID, &petsc_gamg_setup_events[SET1]);CHKERRQ(ierr); 18965b89ad90SMark F. Adams ierr = PetscLogEventRegister(" Graph", PC_CLASSID, &petsc_gamg_setup_events[GRAPH]);CHKERRQ(ierr); 18975b89ad90SMark F. Adams /* PetscLogEventRegister(" G.Mat", PC_CLASSID, &petsc_gamg_setup_events[GRAPH_MAT]); */ 18985b89ad90SMark F. Adams /* PetscLogEventRegister(" G.Filter", PC_CLASSID, &petsc_gamg_setup_events[GRAPH_FILTER]); */ 18995b89ad90SMark F. Adams /* PetscLogEventRegister(" G.Square", PC_CLASSID, &petsc_gamg_setup_events[GRAPH_SQR]); */ 19005b89ad90SMark F. Adams ierr = PetscLogEventRegister(" MIS/Agg", PC_CLASSID, &petsc_gamg_setup_events[SET4]);CHKERRQ(ierr); 19015b89ad90SMark F. Adams ierr = PetscLogEventRegister(" geo: growSupp", PC_CLASSID, &petsc_gamg_setup_events[SET5]);CHKERRQ(ierr); 19025b89ad90SMark F. Adams ierr = PetscLogEventRegister(" geo: triangle", PC_CLASSID, &petsc_gamg_setup_events[SET6]);CHKERRQ(ierr); 1903bb235841SBarry Smith ierr = PetscLogEventRegister(" search-set", PC_CLASSID, &petsc_gamg_setup_events[FIND_V]);CHKERRQ(ierr); 19045b89ad90SMark F. Adams ierr = PetscLogEventRegister(" SA: col data", PC_CLASSID, &petsc_gamg_setup_events[SET7]);CHKERRQ(ierr); 19055b89ad90SMark F. Adams ierr = PetscLogEventRegister(" SA: frmProl0", PC_CLASSID, &petsc_gamg_setup_events[SET8]);CHKERRQ(ierr); 19065b89ad90SMark F. Adams ierr = PetscLogEventRegister(" SA: smooth", PC_CLASSID, &petsc_gamg_setup_events[SET9]);CHKERRQ(ierr); 19075b89ad90SMark F. Adams ierr = PetscLogEventRegister("GAMG: partLevel", PC_CLASSID, &petsc_gamg_setup_events[SET2]);CHKERRQ(ierr); 19085b89ad90SMark F. Adams ierr = PetscLogEventRegister(" repartition", PC_CLASSID, &petsc_gamg_setup_events[SET12]);CHKERRQ(ierr); 19095b89ad90SMark F. Adams ierr = PetscLogEventRegister(" Invert-Sort", PC_CLASSID, &petsc_gamg_setup_events[SET13]);CHKERRQ(ierr); 19105b89ad90SMark F. Adams ierr = PetscLogEventRegister(" Move A", PC_CLASSID, &petsc_gamg_setup_events[SET14]);CHKERRQ(ierr); 19115b89ad90SMark F. Adams ierr = PetscLogEventRegister(" Move P", PC_CLASSID, &petsc_gamg_setup_events[SET15]);CHKERRQ(ierr); 19125b89ad90SMark F. Adams 19135b89ad90SMark F. Adams /* PetscLogEventRegister(" PL move data", PC_CLASSID, &petsc_gamg_setup_events[SET13]); */ 19145b89ad90SMark F. Adams /* PetscLogEventRegister("GAMG: fix", PC_CLASSID, &petsc_gamg_setup_events[SET10]); */ 19155b89ad90SMark F. Adams /* PetscLogEventRegister("GAMG: set levels", PC_CLASSID, &petsc_gamg_setup_events[SET11]); */ 19165b89ad90SMark F. Adams /* create timer stages */ 19175b89ad90SMark F. Adams #if defined GAMG_STAGES 19185b89ad90SMark F. Adams { 19195b89ad90SMark F. Adams char str[32]; 19205b89ad90SMark F. Adams PetscInt lidx; 19215b89ad90SMark F. Adams sprintf(str,"MG Level %d (finest)",0); 19225b89ad90SMark F. Adams ierr = PetscLogStageRegister(str, &gamg_stages[0]);CHKERRQ(ierr); 19235b89ad90SMark F. Adams for (lidx=1; lidx<9; lidx++) { 1924c9567895SMark sprintf(str,"MG Level %d",(int)lidx); 19255b89ad90SMark F. Adams ierr = PetscLogStageRegister(str, &gamg_stages[lidx]);CHKERRQ(ierr); 19265b89ad90SMark F. Adams } 19275b89ad90SMark F. Adams } 19285b89ad90SMark F. Adams #endif 19295b89ad90SMark F. Adams #endif 19303e3471ccSMark Adams PetscFunctionReturn(0); 19313e3471ccSMark Adams } 19323e3471ccSMark Adams 19333e3471ccSMark Adams /*@C 19341c1aac46SBarry Smith PCGAMGFinalizePackage - This function frees everything from the PCGAMG package. It is 19351c1aac46SBarry Smith called from PetscFinalize() automatically. 19363e3471ccSMark Adams 19373e3471ccSMark Adams Level: developer 19383e3471ccSMark Adams 19393e3471ccSMark Adams .seealso: PetscFinalize() 19403e3471ccSMark Adams @*/ 19413e3471ccSMark Adams PetscErrorCode PCGAMGFinalizePackage(void) 19423e3471ccSMark Adams { 19433e3471ccSMark Adams PetscErrorCode ierr; 19443e3471ccSMark Adams 19453e3471ccSMark Adams PetscFunctionBegin; 19463e3471ccSMark Adams PCGAMGPackageInitialized = PETSC_FALSE; 19473e3471ccSMark Adams ierr = PetscFunctionListDestroy(&GAMGList);CHKERRQ(ierr); 19483e3471ccSMark Adams PetscFunctionReturn(0); 19493e3471ccSMark Adams } 1950a36cf38bSToby Isaac 1951a36cf38bSToby Isaac /*@C 1952a36cf38bSToby Isaac PCGAMGRegister - Register a PCGAMG implementation. 1953a36cf38bSToby Isaac 1954a36cf38bSToby Isaac Input Parameters: 1955a36cf38bSToby Isaac + type - string that will be used as the name of the GAMG type. 1956a36cf38bSToby Isaac - create - function for creating the gamg context. 1957a36cf38bSToby Isaac 1958a36cf38bSToby Isaac Level: advanced 1959a36cf38bSToby Isaac 19601c1aac46SBarry Smith .seealso: PCGAMGType, PCGAMG, PCGAMGSetType() 1961a36cf38bSToby Isaac @*/ 1962a36cf38bSToby Isaac PetscErrorCode PCGAMGRegister(PCGAMGType type, PetscErrorCode (*create)(PC)) 1963a36cf38bSToby Isaac { 1964a36cf38bSToby Isaac PetscErrorCode ierr; 1965a36cf38bSToby Isaac 1966a36cf38bSToby Isaac PetscFunctionBegin; 1967a36cf38bSToby Isaac ierr = PCGAMGInitializePackage();CHKERRQ(ierr); 1968a36cf38bSToby Isaac ierr = PetscFunctionListAdd(&GAMGList,type,create);CHKERRQ(ierr); 1969a36cf38bSToby Isaac PetscFunctionReturn(0); 1970a36cf38bSToby Isaac } 1971a36cf38bSToby Isaac 1972