xref: /petsc/src/sys/memory/mhbw.c (revision 08401ef684002a709c6d3db98a0c9f54a8bcf1ec)
12f21b5c6SHong Zhang #include <petscsys.h>             /*I   "petscsys.h"   I*/
22f21b5c6SHong Zhang 
32f21b5c6SHong Zhang #if defined(PETSC_HAVE_MEMKIND)
42f21b5c6SHong Zhang #include <hbwmalloc.h>
52f21b5c6SHong Zhang #endif
62f21b5c6SHong Zhang 
72f21b5c6SHong Zhang /*
82f21b5c6SHong Zhang    These are defined in mal.c and ensure that malloced space is PetscScalar aligned
92f21b5c6SHong Zhang */
10071fcb05SBarry Smith PETSC_EXTERN PetscErrorCode PetscMallocAlign(size_t,PetscBool,int,const char[],const char[],void**);
1195c0884eSLisandro Dalcin PETSC_EXTERN PetscErrorCode PetscFreeAlign(void*,int,const char[],const char[]);
1295c0884eSLisandro Dalcin PETSC_EXTERN PetscErrorCode PetscReallocAlign(size_t,int,const char[],const char[],void**);
132f21b5c6SHong Zhang 
142f21b5c6SHong Zhang /*
152f21b5c6SHong Zhang    PetscHBWMalloc - HBW malloc.
162f21b5c6SHong Zhang 
172f21b5c6SHong Zhang    Input Parameters:
182f21b5c6SHong Zhang    +   a   - number of bytes to allocate
192f21b5c6SHong Zhang    .   lineno - line number where used
202f21b5c6SHong Zhang    .   function - function calling routine
212f21b5c6SHong Zhang    -   filename  - file name where used
222f21b5c6SHong Zhang 
232f21b5c6SHong Zhang    Returns:
242f21b5c6SHong Zhang    double aligned pointer to requested storage, or null if not
252f21b5c6SHong Zhang    available.
262f21b5c6SHong Zhang */
27071fcb05SBarry Smith static PetscErrorCode PetscHBWMalloc(size_t a,PetscBool clear,int lineno,const char function[],const char filename[],void **result)
282f21b5c6SHong Zhang {
292f21b5c6SHong Zhang #if !defined(PETSC_HAVE_MEMKIND)
30071fcb05SBarry Smith   return PetscMallocAlign(a,clear,lineno,function,filename,result);
312f21b5c6SHong Zhang #else
322f21b5c6SHong Zhang   if (!a) { *result = NULL; return 0; }
332f21b5c6SHong Zhang   /*
342f21b5c6SHong Zhang     The default policy is if insufficient memory is available from the high bandwidth memory
352f21b5c6SHong Zhang     fall back to standard memory. If we use the HBW_POLICY_BIND policy, errno is set to ENOMEM
362f21b5c6SHong Zhang     and the allocated pointer is set to NULL if there is not enough HWB memory available.
372f21b5c6SHong Zhang   */
382f21b5c6SHong Zhang   {
392da392ccSBarry Smith     int err = hbw_posix_memalign(result,PETSC_MEMALIGN,a);
40*08401ef6SPierre Jolivet     PetscCheck(!err && *result,PETSC_COMM_SELF,PETSC_ERR_MEM,"HBW Memory requested %.0f",(PetscLogDouble)a);
412f21b5c6SHong Zhang   }
422f21b5c6SHong Zhang   return 0;
432f21b5c6SHong Zhang #endif
442f21b5c6SHong Zhang }
452f21b5c6SHong Zhang 
460bf43a65SHong Zhang static PetscErrorCode PetscHBWFree(void *aa,int lineno,const char function[],const char filename[])
472f21b5c6SHong Zhang {
482f21b5c6SHong Zhang #if !defined(PETSC_HAVE_MEMKIND)
490bf43a65SHong Zhang   return PetscFreeAlign(aa,lineno,function,filename);
502f21b5c6SHong Zhang #else
512f21b5c6SHong Zhang   hbw_free(aa);
522f21b5c6SHong Zhang   return 0;
532f21b5c6SHong Zhang #endif
5413850c04SHong Zhang }
5513850c04SHong Zhang 
560bf43a65SHong Zhang static PetscErrorCode PetscHBWRealloc(size_t a,int lineno,const char function[],const char filename[],void **result)
570bf43a65SHong Zhang {
580bf43a65SHong Zhang #if !defined(PETSC_HAVE_MEMKIND)
590bf43a65SHong Zhang   return PetscReallocAlign(a,lineno,function,filename,result);
600bf43a65SHong Zhang #else
610bf43a65SHong Zhang   if (!a) {
622da392ccSBarry Smith     int err = PetscFreeAlign(*result,lineno,function,filename);
632da392ccSBarry Smith     if (err) return err;
640bf43a65SHong Zhang     *result = NULL;
650bf43a65SHong Zhang     return 0;
660bf43a65SHong Zhang   }
670bf43a65SHong Zhang   *result = hbw_realloc(*result,a);
68*08401ef6SPierre Jolivet   PetscCheck(*result,PETSC_COMM_SELF,PETSC_ERR_MEM,"Memory requested %.0f",(PetscLogDouble)a);
690bf43a65SHong Zhang   return 0;
700bf43a65SHong Zhang #endif
710bf43a65SHong Zhang }
720bf43a65SHong Zhang 
7395c0884eSLisandro Dalcin PETSC_INTERN PetscErrorCode PetscSetUseHBWMalloc_Private(void)
7413850c04SHong Zhang {
7513850c04SHong Zhang   PetscFunctionBegin;
769566063dSJacob Faibussowitsch   PetscCall(PetscMallocSet(PetscHBWMalloc,PetscHBWFree,NULL));
770bf43a65SHong Zhang   PetscTrRealloc = PetscHBWRealloc;
7813850c04SHong Zhang   PetscFunctionReturn(0);
792f21b5c6SHong Zhang }
80