1641875f9SMatthew G Knepley 2641875f9SMatthew G Knepley /* 3d515b9b4SShri Abhyankar Provides an interface to the CHOLMOD sparse solver available through SuiteSparse version 4.2.1 4641875f9SMatthew G Knepley 58999bf53SRichard Mills When built with PETSC_USE_64BIT_INDICES this will use Suitesparse_long as the 6641875f9SMatthew G Knepley integer type in UMFPACK, otherwise it will use int. This means 7641875f9SMatthew G Knepley all integers in this file as simply declared as PetscInt. Also it means 89e475b0dSSatish Balay that one cannot use 64BIT_INDICES on 32bit machines [as Suitesparse_long is 32bit only] 9641875f9SMatthew G Knepley 10641875f9SMatthew G Knepley */ 11641875f9SMatthew G Knepley 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 13c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/cholmod/cholmodimpl.h> 14641875f9SMatthew G Knepley 15641875f9SMatthew G Knepley /* 16641875f9SMatthew G Knepley This is a terrible hack, but it allows the error handler to retain a context. 17641875f9SMatthew G Knepley Note that this hack really cannot be made both reentrant and concurrent. 18641875f9SMatthew G Knepley */ 19641875f9SMatthew G Knepley static Mat static_F; 20641875f9SMatthew G Knepley 21641875f9SMatthew G Knepley static void CholmodErrorHandler(int status,const char *file,int line,const char *message) 22641875f9SMatthew G Knepley { 23ec55ff42SBarry Smith PetscErrorCode ierr; 24641875f9SMatthew G Knepley 25641875f9SMatthew G Knepley PetscFunctionBegin; 26641875f9SMatthew G Knepley if (status > CHOLMOD_OK) { 27e49b6e0cSMatthew G. Knepley ierr = PetscInfo4(static_F,"CHOLMOD warning %d at %s:%d: %s\n",status,file,line,message);CHKERRV(ierr); 28641875f9SMatthew G Knepley } else if (status == CHOLMOD_OK) { /* Documentation says this can happen, but why? */ 29e49b6e0cSMatthew G. Knepley ierr = PetscInfo3(static_F,"CHOLMOD OK at %s:%d: %s\n",file,line,message);CHKERRV(ierr); 30641875f9SMatthew G Knepley } else { 31e49b6e0cSMatthew G. Knepley ierr = PetscErrorPrintf("CHOLMOD error %d at %s:%d: %s\n",status,file,line,message);CHKERRV(ierr); 32641875f9SMatthew G Knepley } 33641875f9SMatthew G Knepley PetscFunctionReturnVoid(); 34641875f9SMatthew G Knepley } 35641875f9SMatthew G Knepley 367087cfbeSBarry Smith PetscErrorCode CholmodStart(Mat F) 37641875f9SMatthew G Knepley { 38641875f9SMatthew G Knepley PetscErrorCode ierr; 396b8f6f9dSBarry Smith Mat_CHOLMOD *chol=(Mat_CHOLMOD*)F->data; 40641875f9SMatthew G Knepley cholmod_common *c; 41ace3abfcSBarry Smith PetscBool flg; 42641875f9SMatthew G Knepley 43641875f9SMatthew G Knepley PetscFunctionBegin; 44641875f9SMatthew G Knepley if (chol->common) PetscFunctionReturn(0); 45854ce69bSBarry Smith ierr = PetscMalloc1(1,&chol->common);CHKERRQ(ierr); 46641875f9SMatthew G Knepley ierr = !cholmod_X_start(chol->common);CHKERRQ(ierr); 4726fbe8dcSKarl Rupp 48641875f9SMatthew G Knepley c = chol->common; 49641875f9SMatthew G Knepley c->error_handler = CholmodErrorHandler; 50641875f9SMatthew G Knepley 51641875f9SMatthew G Knepley #define CHOLMOD_OPTION_DOUBLE(name,help) do { \ 52641875f9SMatthew G Knepley PetscReal tmp = (PetscReal)c->name; \ 538afaa268SBarry Smith ierr = PetscOptionsReal("-mat_cholmod_" #name,help,"None",tmp,&tmp,NULL);CHKERRQ(ierr); \ 54641875f9SMatthew G Knepley c->name = (double)tmp; \ 55641875f9SMatthew G Knepley } while (0) 5626fbe8dcSKarl Rupp 57641875f9SMatthew G Knepley #define CHOLMOD_OPTION_INT(name,help) do { \ 58641875f9SMatthew G Knepley PetscInt tmp = (PetscInt)c->name; \ 598afaa268SBarry Smith ierr = PetscOptionsInt("-mat_cholmod_" #name,help,"None",tmp,&tmp,NULL);CHKERRQ(ierr); \ 60641875f9SMatthew G Knepley c->name = (int)tmp; \ 61641875f9SMatthew G Knepley } while (0) 6226fbe8dcSKarl Rupp 63641875f9SMatthew G Knepley #define CHOLMOD_OPTION_SIZE_T(name,help) do { \ 64*54b3d318SStefano Zampini PetscReal tmp = (PetscInt)c->name; \ 65*54b3d318SStefano Zampini ierr = PetscOptionsReal("-mat_cholmod_" #name,help,"None",tmp,&tmp,NULL);CHKERRQ(ierr); \ 66ce94432eSBarry Smith if (tmp < 0) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_OUTOFRANGE,"value must be positive"); \ 67641875f9SMatthew G Knepley c->name = (size_t)tmp; \ 68641875f9SMatthew G Knepley } while (0) 6926fbe8dcSKarl Rupp 70b9eaa5e8SBarry Smith #define CHOLMOD_OPTION_BOOL(name,help) do { \ 71ace3abfcSBarry Smith PetscBool tmp = (PetscBool) !!c->name; \ 728afaa268SBarry Smith ierr = PetscOptionsBool("-mat_cholmod_" #name,help,"None",tmp,&tmp,NULL);CHKERRQ(ierr); \ 73641875f9SMatthew G Knepley c->name = (int)tmp; \ 74641875f9SMatthew G Knepley } while (0) 75641875f9SMatthew G Knepley 76ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)F),((PetscObject)F)->prefix,"CHOLMOD Options","Mat");CHKERRQ(ierr); 77*54b3d318SStefano Zampini CHOLMOD_OPTION_INT(nmethods,"Number of different ordering methods to try"); 7826fbe8dcSKarl Rupp 79b9eaa5e8SBarry Smith #if defined(PETSC_USE_SUITESPARSE_GPU) 80b9eaa5e8SBarry Smith c->useGPU = 1; 81b9eaa5e8SBarry Smith CHOLMOD_OPTION_INT(useGPU,"Use GPU for BLAS 1, otherwise 0"); 82*54b3d318SStefano Zampini CHOLMOD_OPTION_SIZE_T(maxGpuMemBytes,"Maximum memory to allocate on the GPU"); 83*54b3d318SStefano Zampini CHOLMOD_OPTION_DOUBLE(maxGpuMemFraction,"Fraction of available GPU memory to allocate"); 84b9eaa5e8SBarry Smith #endif 85b9eaa5e8SBarry Smith 86*54b3d318SStefano Zampini /* CHOLMOD handles first-time packing and refactor-packing separately, but we usually want them to be the same. */ 87*54b3d318SStefano Zampini chol->pack = (PetscBool)c->final_pack; 888afaa268SBarry Smith ierr = PetscOptionsBool("-mat_cholmod_pack","Pack factors after factorization [disable for frequent repeat factorization]","None",chol->pack,&chol->pack,NULL);CHKERRQ(ierr); 89641875f9SMatthew G Knepley c->final_pack = (int)chol->pack; 90641875f9SMatthew G Knepley 91641875f9SMatthew G Knepley CHOLMOD_OPTION_DOUBLE(dbound,"Minimum absolute value of diagonal entries of D"); 92641875f9SMatthew G Knepley CHOLMOD_OPTION_DOUBLE(grow0,"Global growth ratio when factors are modified"); 93641875f9SMatthew G Knepley CHOLMOD_OPTION_DOUBLE(grow1,"Column growth ratio when factors are modified"); 94641875f9SMatthew G Knepley CHOLMOD_OPTION_SIZE_T(grow2,"Affine column growth constant when factors are modified"); 95641875f9SMatthew G Knepley CHOLMOD_OPTION_SIZE_T(maxrank,"Max rank of update, larger values are faster but use more memory [2,4,8]"); 96641875f9SMatthew G Knepley { 97641875f9SMatthew G Knepley static const char *const list[] = {"SIMPLICIAL","AUTO","SUPERNODAL","MatCholmodFactorType","MAT_CHOLMOD_FACTOR_",0}; 988afaa268SBarry Smith ierr = PetscOptionsEnum("-mat_cholmod_factor","Factorization method","None",list,(PetscEnum)c->supernodal,(PetscEnum*)&c->supernodal,NULL);CHKERRQ(ierr); 99641875f9SMatthew G Knepley } 100641875f9SMatthew G Knepley if (c->supernodal) CHOLMOD_OPTION_DOUBLE(supernodal_switch,"flop/nnz_L threshold for switching to supernodal factorization"); 101b9eaa5e8SBarry Smith CHOLMOD_OPTION_BOOL(final_asis,"Leave factors \"as is\""); 102b9eaa5e8SBarry Smith CHOLMOD_OPTION_BOOL(final_pack,"Pack the columns when finished (use FALSE if the factors will be updated later)"); 103641875f9SMatthew G Knepley if (!c->final_asis) { 104b9eaa5e8SBarry Smith CHOLMOD_OPTION_BOOL(final_super,"Leave supernodal factors instead of converting to simplicial"); 105b9eaa5e8SBarry Smith CHOLMOD_OPTION_BOOL(final_ll,"Turn LDL' factorization into LL'"); 106b9eaa5e8SBarry Smith CHOLMOD_OPTION_BOOL(final_monotonic,"Ensure columns are monotonic when done"); 107b9eaa5e8SBarry Smith CHOLMOD_OPTION_BOOL(final_resymbol,"Remove numerically zero values resulting from relaxed supernodal amalgamation"); 108641875f9SMatthew G Knepley } 109641875f9SMatthew G Knepley { 110641875f9SMatthew G Knepley PetscReal tmp[] = {(PetscReal)c->zrelax[0],(PetscReal)c->zrelax[1],(PetscReal)c->zrelax[2]}; 111641875f9SMatthew G Knepley PetscInt n = 3; 112641875f9SMatthew G Knepley ierr = PetscOptionsRealArray("-mat_cholmod_zrelax","3 real supernodal relaxed amalgamation parameters","None",tmp,&n,&flg);CHKERRQ(ierr); 113ce94432eSBarry Smith if (flg && n != 3) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_OUTOFRANGE,"must provide exactly 3 parameters to -mat_cholmod_zrelax"); 114641875f9SMatthew G Knepley if (flg) while (n--) c->zrelax[n] = (double)tmp[n]; 115641875f9SMatthew G Knepley } 116641875f9SMatthew G Knepley { 117641875f9SMatthew G Knepley PetscInt n,tmp[] = {(PetscInt)c->nrelax[0],(PetscInt)c->nrelax[1],(PetscInt)c->nrelax[2]}; 118641875f9SMatthew G Knepley ierr = PetscOptionsIntArray("-mat_cholmod_nrelax","3 size_t supernodal relaxed amalgamation parameters","None",tmp,&n,&flg);CHKERRQ(ierr); 119ce94432eSBarry Smith if (flg && n != 3) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ARG_OUTOFRANGE,"must provide exactly 3 parameters to -mat_cholmod_nrelax"); 120641875f9SMatthew G Knepley if (flg) while (n--) c->nrelax[n] = (size_t)tmp[n]; 121641875f9SMatthew G Knepley } 122b9eaa5e8SBarry Smith CHOLMOD_OPTION_BOOL(prefer_upper,"Work with upper triangular form [faster when using fill-reducing ordering, slower in natural ordering]"); 123b9eaa5e8SBarry Smith CHOLMOD_OPTION_BOOL(default_nesdis,"Use NESDIS instead of METIS for nested dissection"); 124641875f9SMatthew G Knepley CHOLMOD_OPTION_INT(print,"Verbosity level"); 125641875f9SMatthew G Knepley ierr = PetscOptionsEnd();CHKERRQ(ierr); 126641875f9SMatthew G Knepley PetscFunctionReturn(0); 127641875f9SMatthew G Knepley } 128641875f9SMatthew G Knepley 129ace3abfcSBarry Smith static PetscErrorCode MatWrapCholmod_seqsbaij(Mat A,PetscBool values,cholmod_sparse *C,PetscBool *aijalloc) 130641875f9SMatthew G Knepley { 131641875f9SMatthew G Knepley Mat_SeqSBAIJ *sbaij = (Mat_SeqSBAIJ*)A->data; 132641875f9SMatthew G Knepley PetscErrorCode ierr; 133641875f9SMatthew G Knepley 134641875f9SMatthew G Knepley PetscFunctionBegin; 135641875f9SMatthew G Knepley ierr = PetscMemzero(C,sizeof(*C));CHKERRQ(ierr); 136641875f9SMatthew G Knepley /* CHOLMOD uses column alignment, SBAIJ stores the upper factor, so we pass it on as a lower factor, swapping the meaning of row and column */ 137641875f9SMatthew G Knepley C->nrow = (size_t)A->cmap->n; 138641875f9SMatthew G Knepley C->ncol = (size_t)A->rmap->n; 139641875f9SMatthew G Knepley C->nzmax = (size_t)sbaij->maxnz; 140641875f9SMatthew G Knepley C->p = sbaij->i; 141641875f9SMatthew G Knepley C->i = sbaij->j; 142641875f9SMatthew G Knepley C->x = sbaij->a; 143641875f9SMatthew G Knepley C->stype = -1; 144641875f9SMatthew G Knepley C->itype = CHOLMOD_INT_TYPE; 145641875f9SMatthew G Knepley C->xtype = CHOLMOD_SCALAR_TYPE; 146641875f9SMatthew G Knepley C->dtype = CHOLMOD_DOUBLE; 147641875f9SMatthew G Knepley C->sorted = 1; 148641875f9SMatthew G Knepley C->packed = 1; 149641875f9SMatthew G Knepley *aijalloc = PETSC_FALSE; 150641875f9SMatthew G Knepley PetscFunctionReturn(0); 151641875f9SMatthew G Knepley } 152641875f9SMatthew G Knepley 153d9ca1df4SBarry Smith static PetscErrorCode VecWrapCholmodRead(Vec X,cholmod_dense *Y) 154641875f9SMatthew G Knepley { 155641875f9SMatthew G Knepley PetscErrorCode ierr; 156d9ca1df4SBarry Smith const PetscScalar *x; 157641875f9SMatthew G Knepley PetscInt n; 158641875f9SMatthew G Knepley 159641875f9SMatthew G Knepley PetscFunctionBegin; 160641875f9SMatthew G Knepley ierr = PetscMemzero(Y,sizeof(*Y));CHKERRQ(ierr); 161d9ca1df4SBarry Smith ierr = VecGetArrayRead(X,&x);CHKERRQ(ierr); 162641875f9SMatthew G Knepley ierr = VecGetSize(X,&n);CHKERRQ(ierr); 16326fbe8dcSKarl Rupp 164641875f9SMatthew G Knepley Y->x = (double*)x; 165641875f9SMatthew G Knepley Y->nrow = n; 166641875f9SMatthew G Knepley Y->ncol = 1; 167641875f9SMatthew G Knepley Y->nzmax = n; 168641875f9SMatthew G Knepley Y->d = n; 169641875f9SMatthew G Knepley Y->x = (double*)x; 170641875f9SMatthew G Knepley Y->xtype = CHOLMOD_SCALAR_TYPE; 171641875f9SMatthew G Knepley Y->dtype = CHOLMOD_DOUBLE; 172641875f9SMatthew G Knepley PetscFunctionReturn(0); 173641875f9SMatthew G Knepley } 174641875f9SMatthew G Knepley 175d9ca1df4SBarry Smith static PetscErrorCode VecUnWrapCholmodRead(Vec X,cholmod_dense *Y) 176d9ca1df4SBarry Smith { 177d9ca1df4SBarry Smith PetscErrorCode ierr; 178d9ca1df4SBarry Smith 179d9ca1df4SBarry Smith PetscFunctionBegin; 180b7be58f8SBarry Smith ierr = VecRestoreArrayRead(X,NULL);CHKERRQ(ierr); 181d9ca1df4SBarry Smith PetscFunctionReturn(0); 182d9ca1df4SBarry Smith } 183d9ca1df4SBarry Smith 184eb9872f6SBarry Smith PETSC_INTERN PetscErrorCode MatDestroy_CHOLMOD(Mat F) 185641875f9SMatthew G Knepley { 186641875f9SMatthew G Knepley PetscErrorCode ierr; 1876b8f6f9dSBarry Smith Mat_CHOLMOD *chol=(Mat_CHOLMOD*)F->data; 188641875f9SMatthew G Knepley 189641875f9SMatthew G Knepley PetscFunctionBegin; 190641875f9SMatthew G Knepley ierr = !cholmod_X_free_factor(&chol->factor,chol->common);CHKERRQ(ierr); 191641875f9SMatthew G Knepley ierr = !cholmod_X_finish(chol->common);CHKERRQ(ierr); 192641875f9SMatthew G Knepley ierr = PetscFree(chol->common);CHKERRQ(ierr); 193641875f9SMatthew G Knepley ierr = PetscFree(chol->matrix);CHKERRQ(ierr); 1946b8f6f9dSBarry Smith ierr = PetscFree(F->data);CHKERRQ(ierr); 195641875f9SMatthew G Knepley PetscFunctionReturn(0); 196641875f9SMatthew G Knepley } 197641875f9SMatthew G Knepley 198641875f9SMatthew G Knepley static PetscErrorCode MatSolve_CHOLMOD(Mat,Vec,Vec); 199641875f9SMatthew G Knepley 200fcd503bcSBarry Smith /*static const char *const CholmodOrderingMethods[] = {"User","AMD","METIS","NESDIS(default)","Natural","NESDIS(small=20000)","NESDIS(small=4,no constrained)","NESDIS()"};*/ 201641875f9SMatthew G Knepley 202860c79edSBarry Smith static PetscErrorCode MatView_Info_CHOLMOD(Mat F,PetscViewer viewer) 203641875f9SMatthew G Knepley { 2046b8f6f9dSBarry Smith Mat_CHOLMOD *chol = (Mat_CHOLMOD*)F->data; 205641875f9SMatthew G Knepley const cholmod_common *c = chol->common; 206641875f9SMatthew G Knepley PetscErrorCode ierr; 207641875f9SMatthew G Knepley PetscInt i; 208641875f9SMatthew G Knepley 209641875f9SMatthew G Knepley PetscFunctionBegin; 210641875f9SMatthew G Knepley if (F->ops->solve != MatSolve_CHOLMOD) PetscFunctionReturn(0); 211641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"CHOLMOD run parameters:\n");CHKERRQ(ierr); 212641875f9SMatthew G Knepley ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); 213641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Pack factors after symbolic factorization: %s\n",chol->pack ? "TRUE" : "FALSE");CHKERRQ(ierr); 214641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.dbound %g (Smallest absolute value of diagonal entries of D)\n",c->dbound);CHKERRQ(ierr); 215641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.grow0 %g\n",c->grow0);CHKERRQ(ierr); 216641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.grow1 %g\n",c->grow1);CHKERRQ(ierr); 217641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.grow2 %u\n",(unsigned)c->grow2);CHKERRQ(ierr); 218641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.maxrank %u\n",(unsigned)c->maxrank);CHKERRQ(ierr); 219641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.supernodal_switch %g\n",c->supernodal_switch);CHKERRQ(ierr); 220641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.supernodal %d\n",c->supernodal);CHKERRQ(ierr); 221641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.final_asis %d\n",c->final_asis);CHKERRQ(ierr); 222641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.final_super %d\n",c->final_super);CHKERRQ(ierr); 223641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.final_ll %d\n",c->final_ll);CHKERRQ(ierr); 224641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.final_pack %d\n",c->final_pack);CHKERRQ(ierr); 225641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.final_monotonic %d\n",c->final_monotonic);CHKERRQ(ierr); 226641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.final_resymbol %d\n",c->final_resymbol);CHKERRQ(ierr); 227641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.zrelax [%g,%g,%g]\n",c->zrelax[0],c->zrelax[1],c->zrelax[2]);CHKERRQ(ierr); 228641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.nrelax [%u,%u,%u]\n",(unsigned)c->nrelax[0],(unsigned)c->nrelax[1],(unsigned)c->nrelax[2]);CHKERRQ(ierr); 229641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.prefer_upper %d\n",c->prefer_upper);CHKERRQ(ierr); 230641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.print %d\n",c->print);CHKERRQ(ierr); 231641875f9SMatthew G Knepley for (i=0; i<c->nmethods; i++) { 232641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Ordering method %D%s:\n",i,i==c->selected ? " [SELECTED]" : "");CHKERRQ(ierr); 233641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer," lnz %g, fl %g, prune_dense %g, prune_dense2 %g\n", 234641875f9SMatthew G Knepley c->method[i].lnz,c->method[i].fl,c->method[i].prune_dense,c->method[i].prune_dense2);CHKERRQ(ierr); 235641875f9SMatthew G Knepley } 236641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.postorder %d\n",c->postorder);CHKERRQ(ierr); 237641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.default_nesdis %d (use NESDIS instead of METIS for nested dissection)\n",c->default_nesdis);CHKERRQ(ierr); 238641875f9SMatthew G Knepley /* Statistics */ 239641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.fl %g (flop count from most recent analysis)\n",c->fl);CHKERRQ(ierr); 240641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.lnz %g (fundamental nz in L)\n",c->lnz);CHKERRQ(ierr); 241641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.anz %g\n",c->anz);CHKERRQ(ierr); 242641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.modfl %g (flop count from most recent update)\n",c->modfl);CHKERRQ(ierr); 243641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.malloc_count %g (number of live objects)\n",(double)c->malloc_count);CHKERRQ(ierr);CHKERRQ(ierr); 244641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.memory_usage %g (peak memory usage in bytes)\n",(double)c->memory_usage);CHKERRQ(ierr);CHKERRQ(ierr); 245641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.memory_inuse %g (current memory usage in bytes)\n",(double)c->memory_inuse);CHKERRQ(ierr);CHKERRQ(ierr); 246641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.nrealloc_col %g (number of column reallocations)\n",c->nrealloc_col);CHKERRQ(ierr);CHKERRQ(ierr); 247641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.nrealloc_factor %g (number of factor reallocations due to column reallocations)\n",c->nrealloc_factor);CHKERRQ(ierr);CHKERRQ(ierr); 248641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.ndbounds_hit %g (number of times diagonal was modified by dbound)\n",c->ndbounds_hit);CHKERRQ(ierr);CHKERRQ(ierr); 249641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.rowfacfl %g (number of flops in last call to cholmod_rowfac)\n",c->rowfacfl);CHKERRQ(ierr);CHKERRQ(ierr); 250641875f9SMatthew G Knepley ierr = PetscViewerASCIIPrintf(viewer,"Common.aatfl %g (number of flops to compute A(:,f)*A(:,f)')\n",c->aatfl);CHKERRQ(ierr);CHKERRQ(ierr); 251b9eaa5e8SBarry Smith #if defined(PETSC_USE_SUITESPARSE_GPU) 252b9eaa5e8SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"Common.useGPU %d\n",c->useGPU);CHKERRQ(ierr);CHKERRQ(ierr); 253b9eaa5e8SBarry Smith #endif 254641875f9SMatthew G Knepley ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); 255641875f9SMatthew G Knepley PetscFunctionReturn(0); 256641875f9SMatthew G Knepley } 257641875f9SMatthew G Knepley 258eb9872f6SBarry Smith PETSC_INTERN PetscErrorCode MatView_CHOLMOD(Mat F,PetscViewer viewer) 259641875f9SMatthew G Knepley { 260641875f9SMatthew G Knepley PetscErrorCode ierr; 261ace3abfcSBarry Smith PetscBool iascii; 262641875f9SMatthew G Knepley PetscViewerFormat format; 263641875f9SMatthew G Knepley 264641875f9SMatthew G Knepley PetscFunctionBegin; 265251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 266641875f9SMatthew G Knepley if (iascii) { 267641875f9SMatthew G Knepley ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 268641875f9SMatthew G Knepley if (format == PETSC_VIEWER_ASCII_INFO) { 269860c79edSBarry Smith ierr = MatView_Info_CHOLMOD(F,viewer);CHKERRQ(ierr); 270641875f9SMatthew G Knepley } 271641875f9SMatthew G Knepley } 272641875f9SMatthew G Knepley PetscFunctionReturn(0); 273641875f9SMatthew G Knepley } 274641875f9SMatthew G Knepley 275641875f9SMatthew G Knepley static PetscErrorCode MatSolve_CHOLMOD(Mat F,Vec B,Vec X) 276641875f9SMatthew G Knepley { 2776b8f6f9dSBarry Smith Mat_CHOLMOD *chol = (Mat_CHOLMOD*)F->data; 278641875f9SMatthew G Knepley cholmod_dense cholB,*cholX; 279641875f9SMatthew G Knepley PetscScalar *x; 280641875f9SMatthew G Knepley PetscErrorCode ierr; 281641875f9SMatthew G Knepley 282641875f9SMatthew G Knepley PetscFunctionBegin; 283d9ca1df4SBarry Smith ierr = VecWrapCholmodRead(B,&cholB);CHKERRQ(ierr); 284641875f9SMatthew G Knepley static_F = F; 285641875f9SMatthew G Knepley cholX = cholmod_X_solve(CHOLMOD_A,chol->factor,&cholB,chol->common); 286641875f9SMatthew G Knepley if (!cholX) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"CHOLMOD failed"); 287d9ca1df4SBarry Smith ierr = VecUnWrapCholmodRead(B,&cholB);CHKERRQ(ierr); 288641875f9SMatthew G Knepley ierr = VecGetArray(X,&x);CHKERRQ(ierr); 289580bdb30SBarry Smith ierr = PetscArraycpy(x,(PetscScalar*)cholX->x,cholX->nrow);CHKERRQ(ierr); 290641875f9SMatthew G Knepley ierr = !cholmod_X_free_dense(&cholX,chol->common);CHKERRQ(ierr); 291641875f9SMatthew G Knepley ierr = VecRestoreArray(X,&x);CHKERRQ(ierr); 292641875f9SMatthew G Knepley PetscFunctionReturn(0); 293641875f9SMatthew G Knepley } 294641875f9SMatthew G Knepley 295641875f9SMatthew G Knepley static PetscErrorCode MatCholeskyFactorNumeric_CHOLMOD(Mat F,Mat A,const MatFactorInfo *info) 296641875f9SMatthew G Knepley { 2976b8f6f9dSBarry Smith Mat_CHOLMOD *chol = (Mat_CHOLMOD*)F->data; 298641875f9SMatthew G Knepley cholmod_sparse cholA; 299ace3abfcSBarry Smith PetscBool aijalloc; 300641875f9SMatthew G Knepley PetscErrorCode ierr; 301641875f9SMatthew G Knepley 302641875f9SMatthew G Knepley PetscFunctionBegin; 303641875f9SMatthew G Knepley ierr = (*chol->Wrap)(A,PETSC_TRUE,&cholA,&aijalloc);CHKERRQ(ierr); 304641875f9SMatthew G Knepley static_F = F; 305641875f9SMatthew G Knepley ierr = !cholmod_X_factorize(&cholA,chol->factor,chol->common); 306ce94432eSBarry Smith if (ierr) SETERRQ1(PetscObjectComm((PetscObject)F),PETSC_ERR_LIB,"CHOLMOD factorization failed with status %d",chol->common->status); 307ce94432eSBarry Smith if (chol->common->status == CHOLMOD_NOT_POSDEF) SETERRQ1(PetscObjectComm((PetscObject)F),PETSC_ERR_MAT_CH_ZRPVT,"CHOLMOD detected that the matrix is not positive definite, failure at column %u",(unsigned)chol->factor->minor); 308641875f9SMatthew G Knepley 309641875f9SMatthew G Knepley if (aijalloc) {ierr = PetscFree3(cholA.p,cholA.i,cholA.x);CHKERRQ(ierr);} 310641875f9SMatthew G Knepley 311641875f9SMatthew G Knepley F->ops->solve = MatSolve_CHOLMOD; 312641875f9SMatthew G Knepley F->ops->solvetranspose = MatSolve_CHOLMOD; 313641875f9SMatthew G Knepley PetscFunctionReturn(0); 314641875f9SMatthew G Knepley } 315641875f9SMatthew G Knepley 316eb9872f6SBarry Smith PETSC_INTERN PetscErrorCode MatCholeskyFactorSymbolic_CHOLMOD(Mat F,Mat A,IS perm,const MatFactorInfo *info) 317641875f9SMatthew G Knepley { 3186b8f6f9dSBarry Smith Mat_CHOLMOD *chol = (Mat_CHOLMOD*)F->data; 319641875f9SMatthew G Knepley PetscErrorCode ierr; 320641875f9SMatthew G Knepley cholmod_sparse cholA; 321ace3abfcSBarry Smith PetscBool aijalloc; 322641875f9SMatthew G Knepley PetscInt *fset = 0; 323641875f9SMatthew G Knepley size_t fsize = 0; 324641875f9SMatthew G Knepley 325641875f9SMatthew G Knepley PetscFunctionBegin; 326641875f9SMatthew G Knepley ierr = (*chol->Wrap)(A,PETSC_FALSE,&cholA,&aijalloc);CHKERRQ(ierr); 327641875f9SMatthew G Knepley static_F = F; 328641875f9SMatthew G Knepley if (chol->factor) { 329641875f9SMatthew G Knepley ierr = !cholmod_X_resymbol(&cholA,fset,fsize,(int)chol->pack,chol->factor,chol->common); 330ce94432eSBarry Smith if (ierr) SETERRQ1(PetscObjectComm((PetscObject)F),PETSC_ERR_LIB,"CHOLMOD analysis failed with status %d",chol->common->status); 331641875f9SMatthew G Knepley } else if (perm) { 332641875f9SMatthew G Knepley const PetscInt *ip; 333641875f9SMatthew G Knepley ierr = ISGetIndices(perm,&ip);CHKERRQ(ierr); 334641875f9SMatthew G Knepley chol->factor = cholmod_X_analyze_p(&cholA,(PetscInt*)ip,fset,fsize,chol->common); 335ce94432eSBarry Smith if (!chol->factor) SETERRQ1(PetscObjectComm((PetscObject)F),PETSC_ERR_LIB,"CHOLMOD analysis failed with status %d",chol->common->status); 336641875f9SMatthew G Knepley ierr = ISRestoreIndices(perm,&ip);CHKERRQ(ierr); 337641875f9SMatthew G Knepley } else { 338641875f9SMatthew G Knepley chol->factor = cholmod_X_analyze(&cholA,chol->common); 339ce94432eSBarry Smith if (!chol->factor) SETERRQ1(PetscObjectComm((PetscObject)F),PETSC_ERR_LIB,"CHOLMOD analysis failed with status %d",chol->common->status); 340641875f9SMatthew G Knepley } 341641875f9SMatthew G Knepley 342641875f9SMatthew G Knepley if (aijalloc) {ierr = PetscFree3(cholA.p,cholA.i,cholA.x);CHKERRQ(ierr);} 343641875f9SMatthew G Knepley 344641875f9SMatthew G Knepley F->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_CHOLMOD; 345641875f9SMatthew G Knepley PetscFunctionReturn(0); 346641875f9SMatthew G Knepley } 347641875f9SMatthew G Knepley 348ea799195SBarry Smith static PetscErrorCode MatFactorGetSolverType_seqsbaij_cholmod(Mat A,MatSolverType *type) 349641875f9SMatthew G Knepley { 350641875f9SMatthew G Knepley PetscFunctionBegin; 351641875f9SMatthew G Knepley *type = MATSOLVERCHOLMOD; 352641875f9SMatthew G Knepley PetscFunctionReturn(0); 353641875f9SMatthew G Knepley } 354641875f9SMatthew G Knepley 355641875f9SMatthew G Knepley /*MC 356641875f9SMatthew G Knepley MATSOLVERCHOLMOD = "cholmod" - A matrix type providing direct solvers (Cholesky) for sequential matrices 357641875f9SMatthew G Knepley via the external package CHOLMOD. 358641875f9SMatthew G Knepley 359c2b89b5dSBarry Smith Use ./configure --download-suitesparse to install PETSc to use CHOLMOD 360c2b89b5dSBarry Smith 361f29f8b16SBarry Smith Use -pc_type cholesky -pc_factor_mat_solver_type cholmod to use this direct solver 362641875f9SMatthew G Knepley 363641875f9SMatthew G Knepley Consult CHOLMOD documentation for more information about the Common parameters 364641875f9SMatthew G Knepley which correspond to the options database keys below. 365641875f9SMatthew G Knepley 366641875f9SMatthew G Knepley Options Database Keys: 367e08999f5SMatthew G Knepley + -mat_cholmod_dbound <0> - Minimum absolute value of diagonal entries of D (None) 368e08999f5SMatthew G Knepley . -mat_cholmod_grow0 <1.2> - Global growth ratio when factors are modified (None) 369e08999f5SMatthew G Knepley . -mat_cholmod_grow1 <1.2> - Column growth ratio when factors are modified (None) 370e08999f5SMatthew G Knepley . -mat_cholmod_grow2 <5> - Affine column growth constant when factors are modified (None) 371e08999f5SMatthew G Knepley . -mat_cholmod_maxrank <8> - Max rank of update, larger values are faster but use more memory [2,4,8] (None) 372e08999f5SMatthew G Knepley . -mat_cholmod_factor <AUTO> - (choose one of) SIMPLICIAL AUTO SUPERNODAL 373e08999f5SMatthew G Knepley . -mat_cholmod_supernodal_switch <40> - flop/nnz_L threshold for switching to supernodal factorization (None) 374e08999f5SMatthew G Knepley . -mat_cholmod_final_asis <TRUE> - Leave factors "as is" (None) 375e08999f5SMatthew G Knepley . -mat_cholmod_final_pack <TRUE> - Pack the columns when finished (use FALSE if the factors will be updated later) (None) 376e08999f5SMatthew G Knepley . -mat_cholmod_zrelax <0.8> - 3 real supernodal relaxed amalgamation parameters (None) 377e08999f5SMatthew G Knepley . -mat_cholmod_nrelax <4> - 3 size_t supernodal relaxed amalgamation parameters (None) 378e08999f5SMatthew G Knepley . -mat_cholmod_prefer_upper <TRUE> - Work with upper triangular form (faster when using fill-reducing ordering, slower in natural ordering) (None) 379e08999f5SMatthew G Knepley - -mat_cholmod_print <3> - Verbosity level (None) 380641875f9SMatthew G Knepley 381641875f9SMatthew G Knepley Level: beginner 382641875f9SMatthew G Knepley 383a364b7d2SBarry Smith Note: CHOLMOD is part of SuiteSparse http://faculty.cse.tamu.edu/davis/suitesparse.html 384a364b7d2SBarry Smith 3853ca39a21SBarry Smith .seealso: PCCHOLESKY, PCFactorSetMatSolverType(), MatSolverType 386641875f9SMatthew G Knepley M*/ 387b2573a8aSBarry Smith 388db87b0f2SBarry Smith PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_cholmod(Mat A,MatFactorType ftype,Mat *F) 389641875f9SMatthew G Knepley { 390641875f9SMatthew G Knepley Mat B; 391641875f9SMatthew G Knepley Mat_CHOLMOD *chol; 392641875f9SMatthew G Knepley PetscErrorCode ierr; 393641875f9SMatthew G Knepley PetscInt m=A->rmap->n,n=A->cmap->n,bs; 394641875f9SMatthew G Knepley 395641875f9SMatthew G Knepley PetscFunctionBegin; 396641875f9SMatthew G Knepley if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"CHOLMOD cannot do %s factorization with SBAIJ, only %s", 397641875f9SMatthew G Knepley MatFactorTypes[ftype],MatFactorTypes[MAT_FACTOR_CHOLESKY]); 398641875f9SMatthew G Knepley ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 399ce94432eSBarry Smith if (bs != 1) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"CHOLMOD only supports block size=1, given %D",bs); 400641875f9SMatthew G Knepley /* Create the factorization matrix F */ 401ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 402641875f9SMatthew G Knepley ierr = MatSetSizes(B,PETSC_DECIDE,PETSC_DECIDE,m,n);CHKERRQ(ierr); 4036b8f6f9dSBarry Smith ierr = PetscStrallocpy("cholmod",&((PetscObject)B)->type_name);CHKERRQ(ierr); 4046b8f6f9dSBarry Smith ierr = MatSetUp(B);CHKERRQ(ierr); 405b00a9115SJed Brown ierr = PetscNewLog(B,&chol);CHKERRQ(ierr); 40626fbe8dcSKarl Rupp 407641875f9SMatthew G Knepley chol->Wrap = MatWrapCholmod_seqsbaij; 4086b8f6f9dSBarry Smith B->data = chol; 409641875f9SMatthew G Knepley 4106b8f6f9dSBarry Smith B->ops->getinfo = MatGetInfo_External; 411641875f9SMatthew G Knepley B->ops->view = MatView_CHOLMOD; 412641875f9SMatthew G Knepley B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_CHOLMOD; 413641875f9SMatthew G Knepley B->ops->destroy = MatDestroy_CHOLMOD; 4143ca39a21SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverType_C",MatFactorGetSolverType_seqsbaij_cholmod);CHKERRQ(ierr); 415641875f9SMatthew G Knepley B->factortype = MAT_FACTOR_CHOLESKY; 416641875f9SMatthew G Knepley B->assembled = PETSC_TRUE; /* required by -ksp_view */ 417641875f9SMatthew G Knepley B->preallocated = PETSC_TRUE; 418641875f9SMatthew G Knepley 419641875f9SMatthew G Knepley ierr = CholmodStart(B);CHKERRQ(ierr); 42000c67f3bSHong Zhang 42100c67f3bSHong Zhang ierr = PetscFree(B->solvertype);CHKERRQ(ierr); 42200c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERCHOLMOD,&B->solvertype);CHKERRQ(ierr); 42300c67f3bSHong Zhang 424641875f9SMatthew G Knepley *F = B; 425641875f9SMatthew G Knepley PetscFunctionReturn(0); 426641875f9SMatthew G Knepley } 427