1dba47a55SKris Buschelman #define PETSCKSP_DLL 2ab718edeSHong Zhang 35582bec1SHong Zhang /* 45582bec1SHong Zhang Provides an interface to the ML 3.0 smoothed Aggregation 55582bec1SHong Zhang */ 65582bec1SHong Zhang #include "src/ksp/pc/pcimpl.h" /*I "petscpc.h" I*/ 75582bec1SHong Zhang #include "src/ksp/pc/impls/mg/mgimpl.h" /*I "petscmg.h" I*/ 85582bec1SHong Zhang #include "src/mat/impls/aij/seq/aij.h" 95582bec1SHong Zhang #include "src/mat/impls/aij/mpi/mpiaij.h" 10cb5d8e9eSHong Zhang 115582bec1SHong Zhang EXTERN_C_BEGIN 125582bec1SHong Zhang #include <math.h> 135582bec1SHong Zhang #include "ml_include.h" 145582bec1SHong Zhang EXTERN_C_END 155582bec1SHong Zhang 165582bec1SHong Zhang /* The context (data structure) at each grid level */ 175582bec1SHong Zhang typedef struct { 185582bec1SHong Zhang Vec x,b,r; /* global vectors */ 195582bec1SHong Zhang Mat A,P,R; 205582bec1SHong Zhang KSP ksp; 215582bec1SHong Zhang } GridCtx; 225582bec1SHong Zhang 235582bec1SHong Zhang /* The context used to input PETSc matrix into ML at fine grid */ 245582bec1SHong Zhang typedef struct { 255582bec1SHong Zhang Mat A,Aloc; 2624a42b14SHong Zhang Vec x,y; 275582bec1SHong Zhang ML_Operator *mlmat; 285582bec1SHong Zhang PetscScalar *pwork; /* tmp array used by PetscML_comm() */ 295582bec1SHong Zhang } FineGridCtx; 305582bec1SHong Zhang 315582bec1SHong Zhang /* The context associates a ML matrix with a PETSc shell matrix */ 325582bec1SHong Zhang typedef struct { 335582bec1SHong Zhang Mat A; /* PETSc shell matrix associated with mlmat */ 345582bec1SHong Zhang ML_Operator *mlmat; /* ML matrix assorciated with A */ 355582bec1SHong Zhang Vec y; 365582bec1SHong Zhang } Mat_MLShell; 375582bec1SHong Zhang 385582bec1SHong Zhang /* Private context for the ML preconditioner */ 395582bec1SHong Zhang typedef struct { 405582bec1SHong Zhang ML *ml_object; 415582bec1SHong Zhang ML_Aggregate *agg_object; 425582bec1SHong Zhang GridCtx *gridctx; 435582bec1SHong Zhang FineGridCtx *PetscMLdata; 445582bec1SHong Zhang PetscInt fine_level,MaxNlevels,MaxCoarseSize,CoarsenScheme; 455582bec1SHong Zhang PetscReal Threshold,DampingFactor; 465582bec1SHong Zhang PetscTruth SpectralNormScheme_Anorm; 475582bec1SHong Zhang PetscMPIInt size; 485582bec1SHong Zhang PetscErrorCode (*PCSetUp)(PC); 495582bec1SHong Zhang PetscErrorCode (*PCDestroy)(PC); 505582bec1SHong Zhang } PC_ML; 515582bec1SHong Zhang extern int PetscML_getrow(void *ML_data,int N_requested_rows,int requested_rows[], 525582bec1SHong Zhang int allocated_space,int columns[],double values[],int row_lengths[]); 535582bec1SHong Zhang extern int PetscML_matvec(void *ML_data, int in_length, double p[], int out_length,double ap[]); 545582bec1SHong Zhang extern int PetscML_comm(double x[], void *ML_data); 555582bec1SHong Zhang extern PetscErrorCode MatMult_ML(Mat,Vec,Vec); 565582bec1SHong Zhang extern PetscErrorCode MatMultAdd_ML(Mat,Vec,Vec,Vec); 57eef31507SHong Zhang extern PetscErrorCode MatConvert_MPIAIJ_ML(Mat,const MatType,MatReuse,Mat*); 585582bec1SHong Zhang extern PetscErrorCode MatDestroy_ML(Mat); 59eef31507SHong Zhang extern PetscErrorCode MatWrapML_SeqAIJ(ML_Operator*,Mat*); 60eef31507SHong Zhang extern PetscErrorCode MatWrapML_MPIAIJ(ML_Operator*,Mat*); 61eef31507SHong Zhang extern PetscErrorCode MatWrapML_SHELL(ML_Operator*,Mat*); 625582bec1SHong Zhang 635582bec1SHong Zhang /* -------------------------------------------------------------------------- */ 645582bec1SHong Zhang /* 655582bec1SHong Zhang PCSetUp_ML - Prepares for the use of the ML preconditioner 665582bec1SHong Zhang by setting data structures and options. 675582bec1SHong Zhang 685582bec1SHong Zhang Input Parameter: 695582bec1SHong Zhang . pc - the preconditioner context 705582bec1SHong Zhang 715582bec1SHong Zhang Application Interface Routine: PCSetUp() 725582bec1SHong Zhang 735582bec1SHong Zhang Notes: 745582bec1SHong Zhang The interface routine PCSetUp() is not usually called directly by 755582bec1SHong Zhang the user, but instead is called by PCApply() if necessary. 765582bec1SHong Zhang */ 776ca4d86aSHong Zhang extern PetscErrorCode PCSetFromOptions_MG(PC); 785582bec1SHong Zhang #undef __FUNCT__ 795582bec1SHong Zhang #define __FUNCT__ "PCSetUp_ML" 806ca4d86aSHong Zhang PetscErrorCode PCSetUp_ML(PC pc) 815582bec1SHong Zhang { 825582bec1SHong Zhang PetscErrorCode ierr; 83eef31507SHong Zhang PetscMPIInt size; 845582bec1SHong Zhang FineGridCtx *PetscMLdata; 855582bec1SHong Zhang ML *ml_object; 865582bec1SHong Zhang ML_Aggregate *agg_object; 875582bec1SHong Zhang ML_Operator *mlmat; 88ac346b81SHong Zhang PetscInt nlocal_allcols,Nlevels,mllevel,level,level1,m,fine_level; 895582bec1SHong Zhang Mat A,Aloc; 905582bec1SHong Zhang GridCtx *gridctx; 915582bec1SHong Zhang PC_ML *pc_ml=PETSC_NULL; 925582bec1SHong Zhang PetscObjectContainer container; 935582bec1SHong Zhang 945582bec1SHong Zhang PetscFunctionBegin; 955582bec1SHong Zhang ierr = PetscObjectQuery((PetscObject)pc,"PC_ML",(PetscObject *)&container);CHKERRQ(ierr); 965582bec1SHong Zhang if (container) { 975582bec1SHong Zhang ierr = PetscObjectContainerGetPointer(container,(void **)&pc_ml);CHKERRQ(ierr); 985582bec1SHong Zhang } else { 995582bec1SHong Zhang SETERRQ(PETSC_ERR_ARG_NULL,"Container does not exit"); 1005582bec1SHong Zhang } 1015582bec1SHong Zhang 1025582bec1SHong Zhang /* setup special features of PCML */ 1035582bec1SHong Zhang /*--------------------------------*/ 1045582bec1SHong Zhang /* covert A to Aloc to be used by ML at fine grid */ 1055582bec1SHong Zhang A = pc->pmat; 1065582bec1SHong Zhang ierr = MPI_Comm_size(A->comm,&size);CHKERRQ(ierr); 1075582bec1SHong Zhang pc_ml->size = size; 1085582bec1SHong Zhang if (size > 1){ 109eef31507SHong Zhang ierr = MatConvert_MPIAIJ_ML(A,PETSC_NULL,MAT_INITIAL_MATRIX,&Aloc);CHKERRQ(ierr); 1105582bec1SHong Zhang } else { 1115582bec1SHong Zhang Aloc = A; 1125582bec1SHong Zhang } 1135582bec1SHong Zhang 1145582bec1SHong Zhang /* create and initialize struct 'PetscMLdata' */ 1155582bec1SHong Zhang ierr = PetscNew(FineGridCtx,&PetscMLdata);CHKERRQ(ierr); 1165582bec1SHong Zhang PetscMLdata->A = A; 1175582bec1SHong Zhang PetscMLdata->Aloc = Aloc; 1185582bec1SHong Zhang ierr = PetscMalloc((Aloc->n+1)*sizeof(PetscScalar),&PetscMLdata->pwork);CHKERRQ(ierr); 1195582bec1SHong Zhang pc_ml->PetscMLdata = PetscMLdata; 1205582bec1SHong Zhang 12124a42b14SHong Zhang ierr = VecCreate(PETSC_COMM_SELF,&PetscMLdata->x);CHKERRQ(ierr); 12224a42b14SHong Zhang if (size == 1){ 1236ca4d86aSHong Zhang ierr = VecSetSizes(PetscMLdata->x,A->n,A->n);CHKERRQ(ierr); 12424a42b14SHong Zhang } else { 1256ca4d86aSHong Zhang ierr = VecSetSizes(PetscMLdata->x,Aloc->n,Aloc->n);CHKERRQ(ierr); 12624a42b14SHong Zhang } 12724a42b14SHong Zhang ierr = VecSetType(PetscMLdata->x,VECSEQ);CHKERRQ(ierr); 12824a42b14SHong Zhang 12924a42b14SHong Zhang ierr = VecCreate(PETSC_COMM_SELF,&PetscMLdata->y);CHKERRQ(ierr); 13024a42b14SHong Zhang ierr = VecSetSizes(PetscMLdata->y,A->m,PETSC_DECIDE);CHKERRQ(ierr); 13124a42b14SHong Zhang ierr = VecSetType(PetscMLdata->y,VECSEQ);CHKERRQ(ierr); 13224a42b14SHong Zhang 1335582bec1SHong Zhang /* create ML discretization matrix at fine grid */ 1345582bec1SHong Zhang ierr = MatGetSize(Aloc,&m,&nlocal_allcols);CHKERRQ(ierr); 1355582bec1SHong Zhang ML_Create(&ml_object,pc_ml->MaxNlevels); 1365582bec1SHong Zhang ML_Init_Amatrix(ml_object,0,m,m,PetscMLdata); 1375582bec1SHong Zhang ML_Set_Amatrix_Getrow(ml_object,0,PetscML_getrow,PetscML_comm,nlocal_allcols); 1385582bec1SHong Zhang ML_Set_Amatrix_Matvec(ml_object,0,PetscML_matvec); 1395582bec1SHong Zhang 1405582bec1SHong Zhang /* aggregation */ 1415582bec1SHong Zhang ML_Aggregate_Create(&agg_object); 1425582bec1SHong Zhang ML_Aggregate_Set_MaxCoarseSize(agg_object,pc_ml->MaxCoarseSize); 1435582bec1SHong Zhang /* set options */ 1445582bec1SHong Zhang switch (pc_ml->CoarsenScheme) { 1455582bec1SHong Zhang case 1: 1465582bec1SHong Zhang ML_Aggregate_Set_CoarsenScheme_Coupled(agg_object);break; 1475582bec1SHong Zhang case 2: 1485582bec1SHong Zhang ML_Aggregate_Set_CoarsenScheme_MIS(agg_object);break; 1495582bec1SHong Zhang case 3: 1505582bec1SHong Zhang ML_Aggregate_Set_CoarsenScheme_METIS(agg_object);break; 1515582bec1SHong Zhang } 1525582bec1SHong Zhang ML_Aggregate_Set_Threshold(agg_object,pc_ml->Threshold); 1535582bec1SHong Zhang ML_Aggregate_Set_DampingFactor(agg_object,pc_ml->DampingFactor); 1545582bec1SHong Zhang if (pc_ml->SpectralNormScheme_Anorm){ 1555582bec1SHong Zhang ML_Aggregate_Set_SpectralNormScheme_Anorm(agg_object); 1565582bec1SHong Zhang } 1575582bec1SHong Zhang 1585582bec1SHong Zhang Nlevels = ML_Gen_MGHierarchy_UsingAggregation(ml_object,0,ML_INCREASING,agg_object); 1595582bec1SHong Zhang if (Nlevels<=0) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"Nlevels %d must > 0",Nlevels); 160*97177400SBarry Smith ierr = PCMGSetLevels(pc,Nlevels,PETSC_NULL);CHKERRQ(ierr); 161*97177400SBarry Smith ierr = PCSetFromOptions_MG(pc);CHKERRQ(ierr); /* should be called in PCSetFromOptions_ML(), but cannot be called prior to PCMGSetLevels() */ 1625582bec1SHong Zhang pc_ml->ml_object = ml_object; 1635582bec1SHong Zhang pc_ml->agg_object = agg_object; 1645582bec1SHong Zhang 1655582bec1SHong Zhang ierr = PetscMalloc(Nlevels*sizeof(GridCtx),&gridctx);CHKERRQ(ierr); 1665582bec1SHong Zhang fine_level = Nlevels - 1; 1675582bec1SHong Zhang pc_ml->gridctx = gridctx; 1685582bec1SHong Zhang pc_ml->fine_level = fine_level; 1695582bec1SHong Zhang 1705582bec1SHong Zhang /* wrap ML matrices by PETSc shell matrices at coarsened grids. 1715582bec1SHong Zhang Level 0 is the finest grid for ML, but coarsest for PETSc! */ 172e14861a4SHong Zhang gridctx[fine_level].A = A; 173e14861a4SHong Zhang level = fine_level - 1; 174ab718edeSHong Zhang if (size == 1){ /* convert ML P, R and A into seqaij format */ 1755582bec1SHong Zhang for (mllevel=1; mllevel<Nlevels; mllevel++){ 176e14861a4SHong Zhang mlmat = &(ml_object->Pmat[mllevel]); 177eef31507SHong Zhang ierr = MatWrapML_SeqAIJ(mlmat,&gridctx[level].P);CHKERRQ(ierr); 178e14861a4SHong Zhang mlmat = &(ml_object->Amat[mllevel]); 179eef31507SHong Zhang ierr = MatWrapML_SeqAIJ(mlmat,&gridctx[level].A);CHKERRQ(ierr); 180e14861a4SHong Zhang mlmat = &(ml_object->Rmat[mllevel-1]); 181eef31507SHong Zhang ierr = MatWrapML_SeqAIJ(mlmat,&gridctx[level].R);CHKERRQ(ierr); 1825582bec1SHong Zhang level--; 1835582bec1SHong Zhang } 184ab718edeSHong Zhang } else { /* convert ML P and R into shell format, ML A into mpiaij format */ 1855582bec1SHong Zhang for (mllevel=1; mllevel<Nlevels; mllevel++){ 1865582bec1SHong Zhang mlmat = &(ml_object->Pmat[mllevel]); 187eef31507SHong Zhang ierr = MatWrapML_SHELL(mlmat,&gridctx[level].P);CHKERRQ(ierr); 188ab718edeSHong Zhang mlmat = &(ml_object->Rmat[mllevel-1]); 189eef31507SHong Zhang ierr = MatWrapML_SHELL(mlmat,&gridctx[level].R);CHKERRQ(ierr); 1905582bec1SHong Zhang mlmat = &(ml_object->Amat[mllevel]); 191eef31507SHong Zhang ierr = MatWrapML_MPIAIJ(mlmat,&gridctx[level].A);CHKERRQ(ierr); 1925582bec1SHong Zhang level--; 1935582bec1SHong Zhang } 1945582bec1SHong Zhang } 1955582bec1SHong Zhang 1965582bec1SHong Zhang /* create coarse level and the interpolation between the levels */ 197ac346b81SHong Zhang for (level=0; level<fine_level; level++){ 1985582bec1SHong Zhang ierr = VecCreate(gridctx[level].A->comm,&gridctx[level].x);CHKERRQ(ierr); 1995582bec1SHong Zhang ierr = VecSetSizes(gridctx[level].x,gridctx[level].A->n,PETSC_DECIDE);CHKERRQ(ierr); 2005582bec1SHong Zhang ierr = VecSetType(gridctx[level].x,VECMPI);CHKERRQ(ierr); 201*97177400SBarry Smith ierr = PCMGSetX(pc,level,gridctx[level].x);CHKERRQ(ierr); 2025582bec1SHong Zhang 2035582bec1SHong Zhang ierr = VecCreate(gridctx[level].A->comm,&gridctx[level].b);CHKERRQ(ierr); 2045582bec1SHong Zhang ierr = VecSetSizes(gridctx[level].b,gridctx[level].A->m,PETSC_DECIDE);CHKERRQ(ierr); 2055582bec1SHong Zhang ierr = VecSetType(gridctx[level].b,VECMPI);CHKERRQ(ierr); 206*97177400SBarry Smith ierr = PCMGSetRhs(pc,level,gridctx[level].b);CHKERRQ(ierr); 207ac346b81SHong Zhang 208ac346b81SHong Zhang level1 = level + 1; 209ac346b81SHong Zhang ierr = VecCreate(gridctx[level1].A->comm,&gridctx[level1].r);CHKERRQ(ierr); 210ac346b81SHong Zhang ierr = VecSetSizes(gridctx[level1].r,gridctx[level1].A->m,PETSC_DECIDE);CHKERRQ(ierr); 211ac346b81SHong Zhang ierr = VecSetType(gridctx[level1].r,VECMPI);CHKERRQ(ierr); 212*97177400SBarry Smith ierr = PCMGSetR(pc,level1,gridctx[level1].r);CHKERRQ(ierr); 213ac346b81SHong Zhang 214*97177400SBarry Smith ierr = PCMGSetInterpolate(pc,level1,gridctx[level].P);CHKERRQ(ierr); 215*97177400SBarry Smith ierr = PCMGSetRestriction(pc,level1,gridctx[level].R);CHKERRQ(ierr); 2165582bec1SHong Zhang 2175582bec1SHong Zhang if (level == 0){ 218*97177400SBarry Smith ierr = PCMGGetCoarseSolve(pc,&gridctx[level].ksp);CHKERRQ(ierr); 2195582bec1SHong Zhang } else { 220*97177400SBarry Smith ierr = PCMGGetSmoother(pc,level,&gridctx[level].ksp);CHKERRQ(ierr); 221*97177400SBarry Smith ierr = PCMGSetResidual(pc,level,PCMGDefaultResidual,gridctx[level].A);CHKERRQ(ierr); 2225582bec1SHong Zhang } 2235582bec1SHong Zhang ierr = KSPSetOperators(gridctx[level].ksp,gridctx[level].A,gridctx[level].A,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 2245582bec1SHong Zhang } 225*97177400SBarry Smith ierr = PCMGGetSmoother(pc,fine_level,&gridctx[fine_level].ksp);CHKERRQ(ierr); 226*97177400SBarry Smith ierr = PCMGSetResidual(pc,fine_level,PCMGDefaultResidual,gridctx[fine_level].A);CHKERRQ(ierr); 227ac346b81SHong Zhang ierr = KSPSetOperators(gridctx[fine_level].ksp,gridctx[level].A,gridctx[fine_level].A,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 228ac346b81SHong Zhang ierr = KSPSetOptionsPrefix(gridctx[fine_level].ksp,"mg_fine_");CHKERRQ(ierr); 2295582bec1SHong Zhang 2305582bec1SHong Zhang /* now call PCSetUp_MG() */ 2315582bec1SHong Zhang /*--------------------------------*/ 2325582bec1SHong Zhang ierr = (*pc_ml->PCSetUp)(pc);CHKERRQ(ierr); 2335582bec1SHong Zhang PetscFunctionReturn(0); 2345582bec1SHong Zhang } 2355582bec1SHong Zhang 2365582bec1SHong Zhang #undef __FUNCT__ 2375582bec1SHong Zhang #define __FUNCT__ "PetscObjectContainerDestroy_PC_ML" 2385582bec1SHong Zhang PetscErrorCode PetscObjectContainerDestroy_PC_ML(void *ptr) 2395582bec1SHong Zhang { 2405582bec1SHong Zhang PetscErrorCode ierr; 2415582bec1SHong Zhang PC_ML *pc_ml = (PC_ML*)ptr; 2425582bec1SHong Zhang PetscInt level; 2435582bec1SHong Zhang 2445582bec1SHong Zhang PetscFunctionBegin; 2455582bec1SHong Zhang if (pc_ml->size > 1){ierr = MatDestroy(pc_ml->PetscMLdata->Aloc);CHKERRQ(ierr);} 2465582bec1SHong Zhang ML_Aggregate_Destroy(&pc_ml->agg_object); 2475582bec1SHong Zhang ML_Destroy(&pc_ml->ml_object); 2485582bec1SHong Zhang 2495582bec1SHong Zhang ierr = PetscFree(pc_ml->PetscMLdata->pwork);CHKERRQ(ierr); 250ac346b81SHong Zhang if (pc_ml->PetscMLdata->x){ierr = VecDestroy(pc_ml->PetscMLdata->x);CHKERRQ(ierr);} 251ac346b81SHong Zhang if (pc_ml->PetscMLdata->y){ierr = VecDestroy(pc_ml->PetscMLdata->y);CHKERRQ(ierr);} 2525582bec1SHong Zhang ierr = PetscFree(pc_ml->PetscMLdata);CHKERRQ(ierr); 2535582bec1SHong Zhang 254ac346b81SHong Zhang for (level=0; level<pc_ml->fine_level; level++){ 255ac346b81SHong Zhang if (pc_ml->gridctx[level].A){ierr = MatDestroy(pc_ml->gridctx[level].A);CHKERRQ(ierr);} 256ac346b81SHong Zhang if (pc_ml->gridctx[level].P){ierr = MatDestroy(pc_ml->gridctx[level].P);CHKERRQ(ierr);} 257ac346b81SHong Zhang if (pc_ml->gridctx[level].R){ierr = MatDestroy(pc_ml->gridctx[level].R);CHKERRQ(ierr);} 258ac346b81SHong Zhang if (pc_ml->gridctx[level].x){ierr = VecDestroy(pc_ml->gridctx[level].x);CHKERRQ(ierr);} 259ac346b81SHong Zhang if (pc_ml->gridctx[level].b){ierr = VecDestroy(pc_ml->gridctx[level].b);CHKERRQ(ierr);} 260ac346b81SHong Zhang if (pc_ml->gridctx[level+1].r){ierr = VecDestroy(pc_ml->gridctx[level+1].r);CHKERRQ(ierr);} 2615582bec1SHong Zhang } 2625582bec1SHong Zhang ierr = PetscFree(pc_ml->gridctx);CHKERRQ(ierr); 2635582bec1SHong Zhang ierr = PetscFree(pc_ml);CHKERRQ(ierr); 2645582bec1SHong Zhang PetscFunctionReturn(0); 2655582bec1SHong Zhang } 2665582bec1SHong Zhang /* -------------------------------------------------------------------------- */ 2675582bec1SHong Zhang /* 2685582bec1SHong Zhang PCDestroy_ML - Destroys the private context for the ML preconditioner 2695582bec1SHong Zhang that was created with PCCreate_ML(). 2705582bec1SHong Zhang 2715582bec1SHong Zhang Input Parameter: 2725582bec1SHong Zhang . pc - the preconditioner context 2735582bec1SHong Zhang 2745582bec1SHong Zhang Application Interface Routine: PCDestroy() 2755582bec1SHong Zhang */ 2765582bec1SHong Zhang #undef __FUNCT__ 2775582bec1SHong Zhang #define __FUNCT__ "PCDestroy_ML" 2786ca4d86aSHong Zhang PetscErrorCode PCDestroy_ML(PC pc) 2795582bec1SHong Zhang { 2805582bec1SHong Zhang PetscErrorCode ierr; 2815582bec1SHong Zhang PC_ML *pc_ml=PETSC_NULL; 2825582bec1SHong Zhang PetscObjectContainer container; 2835582bec1SHong Zhang 2845582bec1SHong Zhang PetscFunctionBegin; 2855582bec1SHong Zhang ierr = PetscObjectQuery((PetscObject)pc,"PC_ML",(PetscObject *)&container);CHKERRQ(ierr); 2865582bec1SHong Zhang if (container) { 2875582bec1SHong Zhang ierr = PetscObjectContainerGetPointer(container,(void **)&pc_ml);CHKERRQ(ierr); 2885582bec1SHong Zhang pc->ops->destroy = pc_ml->PCDestroy; 2895582bec1SHong Zhang } else { 2905582bec1SHong Zhang SETERRQ(PETSC_ERR_ARG_NULL,"Container does not exit"); 2915582bec1SHong Zhang } 2929cb0ec93SHong Zhang /* detach pc and PC_ML and dereference container */ 2935582bec1SHong Zhang ierr = PetscObjectCompose((PetscObject)pc,"PC_ML",0);CHKERRQ(ierr); 2945582bec1SHong Zhang ierr = (*pc->ops->destroy)(pc);CHKERRQ(ierr); 2955582bec1SHong Zhang 2965582bec1SHong Zhang ierr = PetscObjectContainerDestroy(container);CHKERRQ(ierr); 2975582bec1SHong Zhang PetscFunctionReturn(0); 2985582bec1SHong Zhang } 2995582bec1SHong Zhang 3005582bec1SHong Zhang #undef __FUNCT__ 3015582bec1SHong Zhang #define __FUNCT__ "PCSetFromOptions_ML" 3026ca4d86aSHong Zhang PetscErrorCode PCSetFromOptions_ML(PC pc) 3035582bec1SHong Zhang { 3045582bec1SHong Zhang PetscErrorCode ierr; 3055582bec1SHong Zhang PetscInt indx,m,PrintLevel,MaxNlevels,MaxCoarseSize; 3065582bec1SHong Zhang PetscReal Threshold,DampingFactor; 3075582bec1SHong Zhang PetscTruth flg; 3085582bec1SHong Zhang const char *type[] = {"additive","multiplicative","full","cascade","kascade"}; 3095582bec1SHong Zhang const char *scheme[] = {"Uncoupled","Coupled","MIS","METIS"}; 3105582bec1SHong Zhang PC_ML *pc_ml=PETSC_NULL; 3115582bec1SHong Zhang PetscObjectContainer container; 3125582bec1SHong Zhang 3135582bec1SHong Zhang PetscFunctionBegin; 3145582bec1SHong Zhang ierr = PetscObjectQuery((PetscObject)pc,"PC_ML",(PetscObject *)&container);CHKERRQ(ierr); 3155582bec1SHong Zhang if (container) { 3165582bec1SHong Zhang ierr = PetscObjectContainerGetPointer(container,(void **)&pc_ml);CHKERRQ(ierr); 3175582bec1SHong Zhang } else { 3185582bec1SHong Zhang SETERRQ(PETSC_ERR_ARG_NULL,"Container does not exit"); 3195582bec1SHong Zhang } 3206ca4d86aSHong Zhang 3215582bec1SHong Zhang /* inherited MG options */ 3226ca4d86aSHong Zhang ierr = PetscOptionsHead("Multigrid options(inherited)");CHKERRQ(ierr); 3235582bec1SHong Zhang ierr = PetscOptionsInt("-pc_mg_cycles","1 for V cycle, 2 for W-cycle","MGSetCycles",1,&m,&flg);CHKERRQ(ierr); 3245582bec1SHong Zhang ierr = PetscOptionsInt("-pc_mg_smoothup","Number of post-smoothing steps","MGSetNumberSmoothUp",1,&m,&flg);CHKERRQ(ierr); 3255582bec1SHong Zhang ierr = PetscOptionsInt("-pc_mg_smoothdown","Number of pre-smoothing steps","MGSetNumberSmoothDown",1,&m,&flg);CHKERRQ(ierr); 3265582bec1SHong Zhang ierr = PetscOptionsEList("-pc_mg_type","Multigrid type","MGSetType",type,5,type[1],&indx,&flg);CHKERRQ(ierr); 3275582bec1SHong Zhang ierr = PetscOptionsTail();CHKERRQ(ierr); 3285582bec1SHong Zhang 3295582bec1SHong Zhang /* ML options */ 3305582bec1SHong Zhang ierr = PetscOptionsHead("ML options");CHKERRQ(ierr); 3315582bec1SHong Zhang /* set defaults */ 3325582bec1SHong Zhang PrintLevel = 0; 3335582bec1SHong Zhang MaxNlevels = 10; 3345582bec1SHong Zhang MaxCoarseSize = 1; 3355582bec1SHong Zhang indx = 0; 3365582bec1SHong Zhang Threshold = 0.0; 3375582bec1SHong Zhang DampingFactor = 4.0/3.0; 3385582bec1SHong Zhang 3395582bec1SHong Zhang ierr = PetscOptionsInt("-pc_ml_PrintLevel","Print level","ML_Set_PrintLevel",PrintLevel,&PrintLevel,PETSC_NULL);CHKERRQ(ierr); 3405582bec1SHong Zhang ML_Set_PrintLevel(PrintLevel); 3415582bec1SHong Zhang 3425582bec1SHong Zhang ierr = PetscOptionsInt("-pc_ml_maxNlevels","Maximum number of levels","None",MaxNlevels,&MaxNlevels,PETSC_NULL);CHKERRQ(ierr); 3435582bec1SHong Zhang pc_ml->MaxNlevels = MaxNlevels; 3445582bec1SHong Zhang 3455582bec1SHong Zhang ierr = PetscOptionsInt("-pc_ml_maxCoarseSize","Maximum coarsest mesh size","ML_Aggregate_Set_MaxCoarseSize",MaxCoarseSize,&MaxCoarseSize,PETSC_NULL);CHKERRQ(ierr); 3465582bec1SHong Zhang pc_ml->MaxCoarseSize = MaxCoarseSize; 3475582bec1SHong Zhang 3485582bec1SHong Zhang ierr = PetscOptionsEList("-pc_ml_CoarsenScheme","Aggregate Coarsen Scheme","ML_Aggregate_Set_CoarsenScheme_*",scheme,4,scheme[0],&indx,PETSC_NULL);CHKERRQ(ierr); 3495582bec1SHong Zhang pc_ml->CoarsenScheme = indx; 3505582bec1SHong Zhang 3515582bec1SHong Zhang ierr = PetscOptionsReal("-pc_ml_DampingFactor","P damping factor","ML_Aggregate_Set_DampingFactor",DampingFactor,&DampingFactor,PETSC_NULL);CHKERRQ(ierr); 3525582bec1SHong Zhang pc_ml->DampingFactor = DampingFactor; 3535582bec1SHong Zhang 3545582bec1SHong Zhang ierr = PetscOptionsReal("-pc_ml_Threshold","Smoother drop tol","ML_Aggregate_Set_Threshold",Threshold,&Threshold,PETSC_NULL);CHKERRQ(ierr); 3555582bec1SHong Zhang pc_ml->Threshold = Threshold; 3565582bec1SHong Zhang 3575582bec1SHong Zhang ierr = PetscOptionsLogical("-pc_ml_SpectralNormScheme_Anorm","Method used for estimating spectral radius","ML_Aggregate_Set_SpectralNormScheme_Anorm",PETSC_FALSE,&pc_ml->SpectralNormScheme_Anorm,PETSC_FALSE); 3585582bec1SHong Zhang 3595582bec1SHong Zhang ierr = PetscOptionsTail();CHKERRQ(ierr); 3605582bec1SHong Zhang PetscFunctionReturn(0); 3615582bec1SHong Zhang } 3625582bec1SHong Zhang 3635582bec1SHong Zhang /* -------------------------------------------------------------------------- */ 3645582bec1SHong Zhang /* 3655582bec1SHong Zhang PCCreate_ML - Creates a ML preconditioner context, PC_ML, 3665582bec1SHong Zhang and sets this as the private data within the generic preconditioning 3675582bec1SHong Zhang context, PC, that was created within PCCreate(). 3685582bec1SHong Zhang 3695582bec1SHong Zhang Input Parameter: 3705582bec1SHong Zhang . pc - the preconditioner context 3715582bec1SHong Zhang 3725582bec1SHong Zhang Application Interface Routine: PCCreate() 3735582bec1SHong Zhang */ 3745582bec1SHong Zhang 3755582bec1SHong Zhang /*MC 3765582bec1SHong Zhang PCML - Use geometric multigrid preconditioning. This preconditioner requires you provide 3775582bec1SHong Zhang fine grid discretization matrix. The coarser grid matrices and restriction/interpolation 3786ca4d86aSHong Zhang operators are computed by ML, with the matrices coverted to PETSc matrices in aij format 3796ca4d86aSHong Zhang and the restriction/interpolation operators wrapped as PETSc shell matrices. 3805582bec1SHong Zhang 3816ca4d86aSHong Zhang Options Database Key: 3826ca4d86aSHong Zhang Multigrid options(inherited) 3836ca4d86aSHong Zhang + -pc_mg_cycles <1>: 1 for V cycle, 2 for W-cycle (MGSetCycles) 3846ca4d86aSHong Zhang . -pc_mg_smoothup <1>: Number of post-smoothing steps (MGSetNumberSmoothUp) 3856ca4d86aSHong Zhang . -pc_mg_smoothdown <1>: Number of pre-smoothing steps (MGSetNumberSmoothDown) 3866ca4d86aSHong Zhang - -pc_mg_type <multiplicative> (one of) additive multiplicative full cascade kascade 3876ca4d86aSHong Zhang 3886ca4d86aSHong Zhang ML options 3896ca4d86aSHong Zhang + -pc_ml_PrintLevel <0>: Print level (ML_Set_PrintLevel) 3906ca4d86aSHong Zhang . -pc_ml_maxNlevels <10>: Maximum number of levels (None) 3916ca4d86aSHong Zhang . -pc_ml_maxCoarseSize <1>: Maximum coarsest mesh size (ML_Aggregate_Set_MaxCoarseSize) 3926ca4d86aSHong Zhang . -pc_ml_CoarsenScheme <Uncoupled> (one of) Uncoupled Coupled MIS METIS 3936ca4d86aSHong Zhang . -pc_ml_DampingFactor <1.33333>: P damping factor (ML_Aggregate_Set_DampingFactor) 3946ca4d86aSHong Zhang . -pc_ml_Threshold <0>: Smoother drop tol (ML_Aggregate_Set_Threshold) 3956ca4d86aSHong Zhang - -pc_ml_SpectralNormScheme_Anorm: <false> Method used for estimating spectral radius (ML_Aggregate_Set_SpectralNormScheme_Anorm) 3965582bec1SHong Zhang 3975582bec1SHong Zhang Level: intermediate 3985582bec1SHong Zhang 3995582bec1SHong Zhang Concepts: multigrid 4005582bec1SHong Zhang 4015582bec1SHong Zhang .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, PCMGType, 402*97177400SBarry Smith PCMGSetLevels(), PCMGGetLevels(), PCMGSetType(), MPSetCycles(), PCMGSetNumberSmoothDown(), 403*97177400SBarry Smith PCMGSetNumberSmoothUp(), PCMGGetCoarseSolve(), PCMGSetResidual(), PCMGSetInterpolation(), 404*97177400SBarry Smith PCMGSetRestriction(), PCMGGetSmoother(), PCMGGetSmootherUp(), PCMGGetSmootherDown(), 405*97177400SBarry Smith PCMGSetCyclesOnLevel(), PCMGSetRhs(), PCMGSetX(), PCMGSetR() 4065582bec1SHong Zhang M*/ 4075582bec1SHong Zhang 4085582bec1SHong Zhang EXTERN_C_BEGIN 4095582bec1SHong Zhang #undef __FUNCT__ 4105582bec1SHong Zhang #define __FUNCT__ "PCCreate_ML" 411dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCCreate_ML(PC pc) 4125582bec1SHong Zhang { 4135582bec1SHong Zhang PetscErrorCode ierr; 4145582bec1SHong Zhang PC_ML *pc_ml; 4155582bec1SHong Zhang PetscObjectContainer container; 4165582bec1SHong Zhang 4175582bec1SHong Zhang PetscFunctionBegin; 4185582bec1SHong Zhang /* initialize pc as PCMG */ 4195582bec1SHong Zhang ierr = PCSetType(pc,PCMG);CHKERRQ(ierr); /* calls PCCreate_MG() and MGCreate_Private() */ 4205582bec1SHong Zhang 4215582bec1SHong Zhang /* create a supporting struct and attach it to pc */ 4225582bec1SHong Zhang ierr = PetscNew(PC_ML,&pc_ml);CHKERRQ(ierr); 4235582bec1SHong Zhang ierr = PetscObjectContainerCreate(PETSC_COMM_SELF,&container);CHKERRQ(ierr); 4245582bec1SHong Zhang ierr = PetscObjectContainerSetPointer(container,pc_ml);CHKERRQ(ierr); 4259cb0ec93SHong Zhang ierr = PetscObjectContainerSetUserDestroy(container,PetscObjectContainerDestroy_PC_ML);CHKERRQ(ierr); 4265582bec1SHong Zhang ierr = PetscObjectCompose((PetscObject)pc,"PC_ML",(PetscObject)container);CHKERRQ(ierr); 4275582bec1SHong Zhang 4285582bec1SHong Zhang pc_ml->PCSetUp = pc->ops->setup; 4295582bec1SHong Zhang pc_ml->PCDestroy = pc->ops->destroy; 4305582bec1SHong Zhang 4315582bec1SHong Zhang /* overwrite the pointers of PCMG by the functions of PCML */ 4325582bec1SHong Zhang pc->ops->setfromoptions = PCSetFromOptions_ML; 4335582bec1SHong Zhang pc->ops->setup = PCSetUp_ML; 4345582bec1SHong Zhang pc->ops->destroy = PCDestroy_ML; 4355582bec1SHong Zhang PetscFunctionReturn(0); 4365582bec1SHong Zhang } 4375582bec1SHong Zhang EXTERN_C_END 4385582bec1SHong Zhang 4395582bec1SHong Zhang int PetscML_getrow(void *ML_data, int N_requested_rows, int requested_rows[], 4405582bec1SHong Zhang int allocated_space, int columns[], double values[], int row_lengths[]) 4415582bec1SHong Zhang { 4425582bec1SHong Zhang PetscErrorCode ierr; 4435582bec1SHong Zhang Mat Aloc; 4445582bec1SHong Zhang Mat_SeqAIJ *a; 4455582bec1SHong Zhang PetscInt m,i,j,k=0,row,*aj; 4465582bec1SHong Zhang PetscScalar *aa; 4475582bec1SHong Zhang FineGridCtx *ml=(FineGridCtx*)ML_data; 4485582bec1SHong Zhang 4495582bec1SHong Zhang Aloc = ml->Aloc; 4505582bec1SHong Zhang a = (Mat_SeqAIJ*)Aloc->data; 4515582bec1SHong Zhang ierr = MatGetSize(Aloc,&m,PETSC_NULL);CHKERRQ(ierr); 4525582bec1SHong Zhang 4535582bec1SHong Zhang for (i = 0; i<N_requested_rows; i++) { 4545582bec1SHong Zhang row = requested_rows[i]; 4555582bec1SHong Zhang row_lengths[i] = a->ilen[row]; 4565582bec1SHong Zhang if (allocated_space < k+row_lengths[i]) return(0); 4575582bec1SHong Zhang if ( (row >= 0) || (row <= (m-1)) ) { 4585582bec1SHong Zhang aj = a->j + a->i[row]; 4595582bec1SHong Zhang aa = a->a + a->i[row]; 4605582bec1SHong Zhang for (j=0; j<row_lengths[i]; j++){ 4615582bec1SHong Zhang columns[k] = aj[j]; 4625582bec1SHong Zhang values[k++] = aa[j]; 4635582bec1SHong Zhang } 4645582bec1SHong Zhang } 4655582bec1SHong Zhang } 4665582bec1SHong Zhang return(1); 4675582bec1SHong Zhang } 4685582bec1SHong Zhang 4695582bec1SHong Zhang int PetscML_matvec(void *ML_data,int in_length,double p[],int out_length,double ap[]) 4705582bec1SHong Zhang { 4715582bec1SHong Zhang PetscErrorCode ierr; 4725582bec1SHong Zhang FineGridCtx *ml=(FineGridCtx*)ML_data; 4735582bec1SHong Zhang Mat A=ml->A, Aloc=ml->Aloc; 4745582bec1SHong Zhang PetscMPIInt size; 4755582bec1SHong Zhang PetscScalar *pwork=ml->pwork; 4765582bec1SHong Zhang PetscInt i; 4775582bec1SHong Zhang 4785582bec1SHong Zhang ierr = MPI_Comm_size(A->comm,&size);CHKERRQ(ierr); 4795582bec1SHong Zhang if (size == 1){ 48024a42b14SHong Zhang ierr = VecPlaceArray(ml->x,p);CHKERRQ(ierr); 4815582bec1SHong Zhang } else { 4825582bec1SHong Zhang for (i=0; i<in_length; i++) pwork[i] = p[i]; 4835582bec1SHong Zhang PetscML_comm(pwork,ml); 48424a42b14SHong Zhang ierr = VecPlaceArray(ml->x,pwork);CHKERRQ(ierr); 4855582bec1SHong Zhang } 48624a42b14SHong Zhang ierr = VecPlaceArray(ml->y,ap);CHKERRQ(ierr); 48724a42b14SHong Zhang ierr = MatMult(Aloc,ml->x,ml->y);CHKERRQ(ierr); 4885582bec1SHong Zhang return 0; 4895582bec1SHong Zhang } 4905582bec1SHong Zhang 4915582bec1SHong Zhang int PetscML_comm(double p[],void *ML_data) 4925582bec1SHong Zhang { 4935582bec1SHong Zhang PetscErrorCode ierr; 4945582bec1SHong Zhang FineGridCtx *ml=(FineGridCtx*)ML_data; 4955582bec1SHong Zhang Mat A=ml->A; 4965582bec1SHong Zhang Mat_MPIAIJ *a = (Mat_MPIAIJ*)A->data; 4975582bec1SHong Zhang PetscMPIInt size; 4985582bec1SHong Zhang PetscInt i,in_length=A->m,out_length=ml->Aloc->n; 4995582bec1SHong Zhang PetscScalar *array; 5005582bec1SHong Zhang 5015582bec1SHong Zhang ierr = MPI_Comm_size(A->comm,&size);CHKERRQ(ierr); 5025582bec1SHong Zhang if (size == 1) return 0; 50324a42b14SHong Zhang 50424a42b14SHong Zhang ierr = VecPlaceArray(ml->y,p);CHKERRQ(ierr); 50524a42b14SHong Zhang ierr = VecScatterBegin(ml->y,a->lvec,INSERT_VALUES,SCATTER_FORWARD,a->Mvctx);CHKERRQ(ierr); 50624a42b14SHong Zhang ierr = VecScatterEnd(ml->y,a->lvec,INSERT_VALUES,SCATTER_FORWARD,a->Mvctx);CHKERRQ(ierr); 5075582bec1SHong Zhang ierr = VecGetArray(a->lvec,&array);CHKERRQ(ierr); 5085582bec1SHong Zhang for (i=in_length; i<out_length; i++){ 5095582bec1SHong Zhang p[i] = array[i-in_length]; 5105582bec1SHong Zhang } 5115582bec1SHong Zhang return 0; 5125582bec1SHong Zhang } 5135582bec1SHong Zhang #undef __FUNCT__ 5145582bec1SHong Zhang #define __FUNCT__ "MatMult_ML" 5155582bec1SHong Zhang PetscErrorCode MatMult_ML(Mat A,Vec x,Vec y) 5165582bec1SHong Zhang { 5175582bec1SHong Zhang PetscErrorCode ierr; 5185582bec1SHong Zhang Mat_MLShell *shell; 5195582bec1SHong Zhang PetscScalar *xarray,*yarray; 5205582bec1SHong Zhang PetscInt x_length,y_length; 5215582bec1SHong Zhang 5225582bec1SHong Zhang PetscFunctionBegin; 5235582bec1SHong Zhang ierr = MatShellGetContext(A,(void *)&shell);CHKERRQ(ierr); 5245582bec1SHong Zhang ierr = VecGetArray(x,&xarray);CHKERRQ(ierr); 5255582bec1SHong Zhang ierr = VecGetArray(y,&yarray);CHKERRQ(ierr); 5265582bec1SHong Zhang x_length = shell->mlmat->invec_leng; 5275582bec1SHong Zhang y_length = shell->mlmat->outvec_leng; 5285582bec1SHong Zhang 5295582bec1SHong Zhang ML_Operator_Apply(shell->mlmat,x_length,xarray,y_length,yarray); 5305582bec1SHong Zhang 5315582bec1SHong Zhang ierr = VecRestoreArray(x,&xarray);CHKERRQ(ierr); 5325582bec1SHong Zhang ierr = VecRestoreArray(y,&yarray);CHKERRQ(ierr); 5335582bec1SHong Zhang PetscFunctionReturn(0); 5345582bec1SHong Zhang } 5355582bec1SHong Zhang /* MatMultAdd_ML - Compute y = w + A*x */ 5365582bec1SHong Zhang #undef __FUNCT__ 5375582bec1SHong Zhang #define __FUNCT__ "MatMultAdd_ML" 5385582bec1SHong Zhang PetscErrorCode MatMultAdd_ML(Mat A,Vec x,Vec w,Vec y) 5395582bec1SHong Zhang { 5405582bec1SHong Zhang PetscErrorCode ierr; 5415582bec1SHong Zhang Mat_MLShell *shell; 5425582bec1SHong Zhang PetscScalar *xarray,*yarray; 5435582bec1SHong Zhang const PetscScalar one=1.0; 5445582bec1SHong Zhang PetscInt x_length,y_length; 5455582bec1SHong Zhang 5465582bec1SHong Zhang PetscFunctionBegin; 5475582bec1SHong Zhang ierr = MatShellGetContext(A,(void *)&shell);CHKERRQ(ierr); 5485582bec1SHong Zhang ierr = VecGetArray(x,&xarray);CHKERRQ(ierr); 5495582bec1SHong Zhang ierr = VecGetArray(y,&yarray);CHKERRQ(ierr); 5505582bec1SHong Zhang 5515582bec1SHong Zhang x_length = shell->mlmat->invec_leng; 5525582bec1SHong Zhang y_length = shell->mlmat->outvec_leng; 5535582bec1SHong Zhang 5545582bec1SHong Zhang ML_Operator_Apply(shell->mlmat,x_length,xarray,y_length,yarray); 5555582bec1SHong Zhang 5565582bec1SHong Zhang ierr = VecRestoreArray(x,&xarray);CHKERRQ(ierr); 5575582bec1SHong Zhang ierr = VecRestoreArray(y,&yarray);CHKERRQ(ierr); 5585582bec1SHong Zhang ierr = VecAXPY(&one,w,y);CHKERRQ(ierr); 5595582bec1SHong Zhang 5605582bec1SHong Zhang PetscFunctionReturn(0); 5615582bec1SHong Zhang } 5625582bec1SHong Zhang 5635582bec1SHong Zhang /* newtype is ignored because "ml" is not listed under Petsc MatType yet */ 5645582bec1SHong Zhang #undef __FUNCT__ 5655582bec1SHong Zhang #define __FUNCT__ "MatConvert_MPIAIJ_ML" 566eef31507SHong Zhang PetscErrorCode MatConvert_MPIAIJ_ML(Mat A,const MatType newtype,MatReuse scall,Mat *Aloc) 5675582bec1SHong Zhang { 5685582bec1SHong Zhang PetscErrorCode ierr; 5695582bec1SHong Zhang Mat_MPIAIJ *mpimat=(Mat_MPIAIJ*)A->data; 5705582bec1SHong Zhang Mat_SeqAIJ *mat,*a=(Mat_SeqAIJ*)(mpimat->A)->data,*b=(Mat_SeqAIJ*)(mpimat->B)->data; 5715582bec1SHong Zhang PetscInt *ai=a->i,*aj=a->j,*bi=b->i,*bj=b->j; 5725582bec1SHong Zhang PetscScalar *aa=a->a,*ba=b->a,*ca; 5735582bec1SHong Zhang PetscInt am=A->m,an=A->n,i,j,k; 5745582bec1SHong Zhang PetscInt *ci,*cj,ncols; 5755582bec1SHong Zhang 5765582bec1SHong Zhang PetscFunctionBegin; 5775582bec1SHong Zhang if (am != an) SETERRQ2(PETSC_ERR_ARG_WRONG,"A must have a square diagonal portion, am: %d != an: %d",am,an); 5785582bec1SHong Zhang 5795582bec1SHong Zhang if (scall == MAT_INITIAL_MATRIX){ 5805582bec1SHong Zhang ierr = PetscMalloc((1+am)*sizeof(PetscInt),&ci);CHKERRQ(ierr); 5815582bec1SHong Zhang ci[0] = 0; 5825582bec1SHong Zhang for (i=0; i<am; i++){ 5835582bec1SHong Zhang ci[i+1] = ci[i] + (ai[i+1] - ai[i]) + (bi[i+1] - bi[i]); 5845582bec1SHong Zhang } 5855582bec1SHong Zhang ierr = PetscMalloc((1+ci[am])*sizeof(PetscInt),&cj);CHKERRQ(ierr); 5865582bec1SHong Zhang ierr = PetscMalloc((1+ci[am])*sizeof(PetscScalar),&ca);CHKERRQ(ierr); 5875582bec1SHong Zhang 5885582bec1SHong Zhang k = 0; 5895582bec1SHong Zhang for (i=0; i<am; i++){ 5905582bec1SHong Zhang /* diagonal portion of A */ 5915582bec1SHong Zhang ncols = ai[i+1] - ai[i]; 5925582bec1SHong Zhang for (j=0; j<ncols; j++) { 5935582bec1SHong Zhang cj[k] = *aj++; 5945582bec1SHong Zhang ca[k++] = *aa++; 5955582bec1SHong Zhang } 5965582bec1SHong Zhang /* off-diagonal portion of A */ 5975582bec1SHong Zhang ncols = bi[i+1] - bi[i]; 5985582bec1SHong Zhang for (j=0; j<ncols; j++) { 5995582bec1SHong Zhang cj[k] = an + (*bj); bj++; 6005582bec1SHong Zhang ca[k++] = *ba++; 6015582bec1SHong Zhang } 6025582bec1SHong Zhang } 6035582bec1SHong Zhang if (k != ci[am]) SETERRQ2(PETSC_ERR_ARG_WRONG,"k: %d != ci[am]: %d",k,ci[am]); 6045582bec1SHong Zhang 6055582bec1SHong Zhang /* put together the new matrix */ 6065582bec1SHong Zhang an = mpimat->A->n+mpimat->B->n; 6075582bec1SHong Zhang ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,am,an,ci,cj,ca,Aloc);CHKERRQ(ierr); 6085582bec1SHong Zhang 6095582bec1SHong Zhang /* MatCreateSeqAIJWithArrays flags matrix so PETSc doesn't free the user's arrays. */ 6105582bec1SHong Zhang /* Since these are PETSc arrays, change flags to free them as necessary. */ 6115582bec1SHong Zhang mat = (Mat_SeqAIJ*)(*Aloc)->data; 6125582bec1SHong Zhang mat->freedata = PETSC_TRUE; 6135582bec1SHong Zhang mat->nonew = 0; 6145582bec1SHong Zhang } else if (scall == MAT_REUSE_MATRIX){ 6155582bec1SHong Zhang mat=(Mat_SeqAIJ*)(*Aloc)->data; 6165582bec1SHong Zhang ci = mat->i; cj = mat->j; ca = mat->a; 6175582bec1SHong Zhang for (i=0; i<am; i++) { 6185582bec1SHong Zhang /* diagonal portion of A */ 6195582bec1SHong Zhang ncols = ai[i+1] - ai[i]; 6205582bec1SHong Zhang for (j=0; j<ncols; j++) *ca++ = *aa++; 6215582bec1SHong Zhang /* off-diagonal portion of A */ 6225582bec1SHong Zhang ncols = bi[i+1] - bi[i]; 6235582bec1SHong Zhang for (j=0; j<ncols; j++) *ca++ = *ba++; 6245582bec1SHong Zhang } 6255582bec1SHong Zhang } else { 6265582bec1SHong Zhang SETERRQ1(PETSC_ERR_ARG_WRONG,"Invalid MatReuse %d",(int)scall); 6275582bec1SHong Zhang } 6285582bec1SHong Zhang PetscFunctionReturn(0); 6295582bec1SHong Zhang } 6305582bec1SHong Zhang extern PetscErrorCode MatDestroy_Shell(Mat); 6315582bec1SHong Zhang #undef __FUNCT__ 6325582bec1SHong Zhang #define __FUNCT__ "MatDestroy_ML" 6335582bec1SHong Zhang PetscErrorCode MatDestroy_ML(Mat A) 6345582bec1SHong Zhang { 6355582bec1SHong Zhang PetscErrorCode ierr; 6365582bec1SHong Zhang Mat_MLShell *shell; 6375582bec1SHong Zhang 6385582bec1SHong Zhang PetscFunctionBegin; 6395582bec1SHong Zhang ierr = MatShellGetContext(A,(void *)&shell);CHKERRQ(ierr); 6405582bec1SHong Zhang ierr = VecDestroy(shell->y);CHKERRQ(ierr); 6415582bec1SHong Zhang ierr = PetscFree(shell);CHKERRQ(ierr); 6425582bec1SHong Zhang ierr = MatDestroy_Shell(A);CHKERRQ(ierr); 6435582bec1SHong Zhang PetscFunctionReturn(0); 6445582bec1SHong Zhang } 6455582bec1SHong Zhang 6465582bec1SHong Zhang #undef __FUNCT__ 647eef31507SHong Zhang #define __FUNCT__ "MatWrapML_SeqAIJ" 648eef31507SHong Zhang PetscErrorCode MatWrapML_SeqAIJ(ML_Operator *mlmat,Mat *newmat) 6495582bec1SHong Zhang { 650e14861a4SHong Zhang struct ML_CSR_MSRdata *matdata = (struct ML_CSR_MSRdata *)mlmat->data; 6515582bec1SHong Zhang PetscErrorCode ierr; 652e14861a4SHong Zhang PetscInt m=mlmat->outvec_leng,n=mlmat->invec_leng,nnz[m],nz_max; 653e14861a4SHong Zhang PetscInt *ml_cols=matdata->columns,*aj,i,j,k; 654e14861a4SHong Zhang PetscScalar *ml_vals=matdata->values,*aa; 6555582bec1SHong Zhang 6565582bec1SHong Zhang PetscFunctionBegin; 657e14861a4SHong Zhang if ( mlmat->getrow == NULL) SETERRQ(PETSC_ERR_ARG_NULL,"mlmat->getrow = NULL"); 658ab718edeSHong Zhang if (m != n){ /* ML Pmat and Rmat are in CSR format. Pass array pointers into SeqAIJ matrix */ 659e14861a4SHong Zhang ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,m,n,matdata->rowptr,ml_cols,ml_vals,newmat);CHKERRQ(ierr); 66024a42b14SHong Zhang PetscFunctionReturn(0); 66124a42b14SHong Zhang } 6625582bec1SHong Zhang 663e14861a4SHong Zhang /* ML Amat is in MSR format. Copy its data into SeqAIJ matrix */ 6645582bec1SHong Zhang ierr = MatCreate(PETSC_COMM_SELF,m,n,PETSC_DECIDE,PETSC_DECIDE,newmat);CHKERRQ(ierr); 6655582bec1SHong Zhang ierr = MatSetType(*newmat,MATSEQAIJ);CHKERRQ(ierr); 666e14861a4SHong Zhang 667e14861a4SHong Zhang nz_max = 0; 6685582bec1SHong Zhang for (i=0; i<m; i++) { 669e14861a4SHong Zhang nnz[i] = ml_cols[i+1] - ml_cols[i] + 1; 670e14861a4SHong Zhang if (nnz[i] > nz_max) nz_max = nnz[i]; 6715582bec1SHong Zhang } 6725582bec1SHong Zhang ierr = MatSeqAIJSetPreallocation(*newmat,0,nnz);CHKERRQ(ierr); 673ab718edeSHong Zhang ierr = MatSetOption(*newmat,MAT_COLUMNS_SORTED);CHKERRQ(ierr); /* check! */ 6745582bec1SHong Zhang 675e14861a4SHong Zhang nz_max++; 676e14861a4SHong Zhang ierr = PetscMalloc(nz_max*(sizeof(int)+sizeof(PetscScalar)),&aj);CHKERRQ(ierr); 677e14861a4SHong Zhang aa = (PetscScalar*)(aj + nz_max); 67824a42b14SHong Zhang 6795582bec1SHong Zhang for (i=0; i<m; i++){ 680e14861a4SHong Zhang k = 0; 681e14861a4SHong Zhang /* diagonal entry */ 682e14861a4SHong Zhang aj[k] = i; aa[k++] = ml_vals[i]; 683e14861a4SHong Zhang /* off diagonal entries */ 684e14861a4SHong Zhang for (j=ml_cols[i]; j<ml_cols[i+1]; j++){ 685e14861a4SHong Zhang aj[k] = ml_cols[j]; aa[k++] = ml_vals[j]; 68624a42b14SHong Zhang } 687ab718edeSHong Zhang /* sort aj and aa */ 688e14861a4SHong Zhang ierr = PetscSortIntWithScalarArray(nnz[i],aj,aa);CHKERRQ(ierr); 689e14861a4SHong Zhang ierr = MatSetValues(*newmat,1,&i,nnz[i],aj,aa,INSERT_VALUES);CHKERRQ(ierr); 6905582bec1SHong Zhang } 6915582bec1SHong Zhang ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6925582bec1SHong Zhang ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 693e14861a4SHong Zhang ierr = PetscFree(aj);CHKERRQ(ierr); 6945582bec1SHong Zhang PetscFunctionReturn(0); 6955582bec1SHong Zhang } 6965582bec1SHong Zhang 6975582bec1SHong Zhang #undef __FUNCT__ 698eef31507SHong Zhang #define __FUNCT__ "MatWrapML_SHELL" 699eef31507SHong Zhang PetscErrorCode MatWrapML_SHELL(ML_Operator *mlmat,Mat *newmat) 7005582bec1SHong Zhang { 7015582bec1SHong Zhang PetscErrorCode ierr; 7025582bec1SHong Zhang PetscInt m,n; 7035582bec1SHong Zhang ML_Comm *MLcomm; 7045582bec1SHong Zhang Mat_MLShell *shellctx; 7055582bec1SHong Zhang 7065582bec1SHong Zhang PetscFunctionBegin; 7075582bec1SHong Zhang m = mlmat->outvec_leng; 7085582bec1SHong Zhang n = mlmat->invec_leng; 7095582bec1SHong Zhang if (!m || !n){ 7105582bec1SHong Zhang newmat = PETSC_NULL; 7115582bec1SHong Zhang } else { 7125582bec1SHong Zhang MLcomm = mlmat->comm; 7135582bec1SHong Zhang ierr = PetscNew(Mat_MLShell,&shellctx);CHKERRQ(ierr); 7145582bec1SHong Zhang ierr = MatCreateShell(MLcomm->USR_comm,m,n,PETSC_DETERMINE,PETSC_DETERMINE,shellctx,newmat);CHKERRQ(ierr); 7155582bec1SHong Zhang ierr = MatShellSetOperation(*newmat,MATOP_MULT,(void *)MatMult_ML);CHKERRQ(ierr); 7165582bec1SHong Zhang ierr = MatShellSetOperation(*newmat,MATOP_MULT_ADD,(void *)MatMultAdd_ML);CHKERRQ(ierr); 7175582bec1SHong Zhang shellctx->A = *newmat; 7185582bec1SHong Zhang shellctx->mlmat = mlmat; 7195582bec1SHong Zhang ierr = VecCreate(PETSC_COMM_WORLD,&shellctx->y);CHKERRQ(ierr); 7205582bec1SHong Zhang ierr = VecSetSizes(shellctx->y,m,PETSC_DECIDE);CHKERRQ(ierr); 7215582bec1SHong Zhang ierr = VecSetFromOptions(shellctx->y);CHKERRQ(ierr); 7225582bec1SHong Zhang (*newmat)->ops->destroy = MatDestroy_ML; 7235582bec1SHong Zhang } 7245582bec1SHong Zhang PetscFunctionReturn(0); 7255582bec1SHong Zhang } 726e14861a4SHong Zhang 727e14861a4SHong Zhang #undef __FUNCT__ 728eef31507SHong Zhang #define __FUNCT__ "MatWrapML_MPIAIJ" 729eef31507SHong Zhang PetscErrorCode MatWrapML_MPIAIJ(ML_Operator *mlmat,Mat *newmat) 730e14861a4SHong Zhang { 731ab718edeSHong Zhang struct ML_CSR_MSRdata *matdata = (struct ML_CSR_MSRdata *)mlmat->data; 732ab718edeSHong Zhang PetscInt *ml_cols=matdata->columns,*aj; 733ab718edeSHong Zhang PetscScalar *ml_vals=matdata->values,*aa; 734e14861a4SHong Zhang PetscErrorCode ierr; 735ab718edeSHong Zhang PetscInt i,j,k,*gordering; 736ab718edeSHong Zhang PetscInt m=mlmat->outvec_leng,n,nnzA[m],nnzB[m],nnz[m],nz_max,row; 737ab718edeSHong Zhang Mat A; 738e14861a4SHong Zhang 739e14861a4SHong Zhang PetscFunctionBegin; 740ab718edeSHong Zhang if (mlmat->getrow == NULL) SETERRQ(PETSC_ERR_ARG_NULL,"mlmat->getrow = NULL"); 741ab718edeSHong Zhang n = mlmat->invec_leng; 742e14861a4SHong Zhang if (m != n) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"m %d must equal to n %d",m,n); 743e14861a4SHong Zhang 744ab718edeSHong Zhang ierr = MatCreate(mlmat->comm->USR_comm,m,n,PETSC_DECIDE,PETSC_DECIDE,&A);CHKERRQ(ierr); 745ab718edeSHong Zhang ierr = MatSetType(A,MATMPIAIJ);CHKERRQ(ierr); 746e14861a4SHong Zhang nz_max = 0; 747e14861a4SHong Zhang for (i=0; i<m; i++){ 748ab718edeSHong Zhang nnz[i] = ml_cols[i+1] - ml_cols[i] + 1; 749e14861a4SHong Zhang if (nz_max < nnz[i]) nz_max = nnz[i]; 750ab718edeSHong Zhang nnzA[i] = 1; /* diag */ 751ab718edeSHong Zhang for (j=ml_cols[i]; j<ml_cols[i+1]; j++){ 752ab718edeSHong Zhang if (ml_cols[j] < m) nnzA[i]++; 753e14861a4SHong Zhang } 754e14861a4SHong Zhang nnzB[i] = nnz[i] - nnzA[i]; 755e14861a4SHong Zhang } 756ab718edeSHong Zhang ierr = MatMPIAIJSetPreallocation(A,0,nnzA,0,nnzB);CHKERRQ(ierr); 757e14861a4SHong Zhang 758ab718edeSHong Zhang /* insert mat values -- remap row and column indices */ 759ab718edeSHong Zhang nz_max++; 760ab718edeSHong Zhang ierr = PetscMalloc(nz_max*(sizeof(int)+sizeof(PetscScalar)),&aj);CHKERRQ(ierr); 761ab718edeSHong Zhang aa = (PetscScalar*)(aj + nz_max); 762ab718edeSHong Zhang ML_build_global_numbering(mlmat,mlmat->comm,&gordering); 763e14861a4SHong Zhang for (i=0; i<m; i++){ 764e14861a4SHong Zhang row = gordering[i]; 765ab718edeSHong Zhang k = 0; 766ab718edeSHong Zhang /* diagonal entry */ 767ab718edeSHong Zhang aj[k] = row; aa[k++] = ml_vals[i]; 768ab718edeSHong Zhang /* off diagonal entries */ 769ab718edeSHong Zhang for (j=ml_cols[i]; j<ml_cols[i+1]; j++){ 770ab718edeSHong Zhang aj[k] = gordering[ml_cols[j]]; aa[k++] = ml_vals[j]; 771e14861a4SHong Zhang } 772ab718edeSHong Zhang ierr = MatSetValues(A,1,&row,nnz[i],aj,aa,INSERT_VALUES);CHKERRQ(ierr); 773e14861a4SHong Zhang } 774ab718edeSHong Zhang ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 775ab718edeSHong Zhang ierr = MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 776ab718edeSHong Zhang *newmat = A; 777e14861a4SHong Zhang 778ab718edeSHong Zhang ierr = PetscFree(aj);CHKERRQ(ierr); 779e14861a4SHong Zhang PetscFunctionReturn(0); 780e14861a4SHong Zhang } 781