1af0996ceSBarry Smith #include <petsc/private/petscimpl.h> 205035670SJunchao Zhang 3c2a741eeSJunchao Zhang #if defined(PETSC_HAVE_CUDA) 4c2a741eeSJunchao Zhang #include <cuda_runtime.h> 505035670SJunchao Zhang #endif 605035670SJunchao Zhang 705035670SJunchao Zhang #if defined(PETSC_HAVE_HIP) 805035670SJunchao Zhang #include <hip/hip_runtime.h> 9c2a741eeSJunchao Zhang #endif 10d96cc911SJed Brown 1128559dc8SJed Brown static PetscInt petsc_checkpointer_intensity = 1; 1228559dc8SJed Brown 1328559dc8SJed Brown /*@ 1428559dc8SJed Brown PetscCheckPointerSetIntensity - An intense pointer check registers a signal handler and attempts to dereference to 1528559dc8SJed Brown confirm whether the address is valid. An intensity of 0 never uses signal handlers, 1 uses them when not in a "hot" 1628559dc8SJed Brown function, and intensity of 2 always uses a signal handler. 1728559dc8SJed Brown 1828559dc8SJed Brown Not Collective 1928559dc8SJed Brown 20*4165533cSJose E. Roman Input Parameter: 2128559dc8SJed Brown . intensity - how much to check pointers for validity 2228559dc8SJed Brown 23c2f74817SBarry Smith Options Database: 245789d1f5SJed Brown . -check_pointer_intensity - intensity (0, 1, or 2) 25c2f74817SBarry Smith 2628559dc8SJed Brown Level: advanced 2728559dc8SJed Brown 285789d1f5SJed Brown .seealso: PetscCheckPointer(), PetscFunctionBeginHot() 2928559dc8SJed Brown @*/ 3028559dc8SJed Brown PetscErrorCode PetscCheckPointerSetIntensity(PetscInt intensity) 3128559dc8SJed Brown { 3228559dc8SJed Brown 3328559dc8SJed Brown PetscFunctionBegin; 3428559dc8SJed Brown switch (intensity) { 3528559dc8SJed Brown case 0: 3628559dc8SJed Brown case 1: 3728559dc8SJed Brown case 2: 3828559dc8SJed Brown petsc_checkpointer_intensity = intensity; 3928559dc8SJed Brown break; 4028559dc8SJed Brown default: SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Intensity %D not in 0,1,2",intensity); 4128559dc8SJed Brown } 4228559dc8SJed Brown PetscFunctionReturn(0); 4328559dc8SJed Brown } 4428559dc8SJed Brown 45d96cc911SJed Brown /* ---------------------------------------------------------------------------------------*/ 46718fc407SJed Brown 47718fc407SJed Brown #if defined(PETSC_HAVE_SETJMP_H) 48d96cc911SJed Brown #include <setjmp.h> 49f8a67e6dSJed Brown static jmp_buf PetscSegvJumpBuf; 50f8a67e6dSJed Brown static PetscBool PetscSegvJumpBuf_set; 51f8a67e6dSJed Brown 52f8a67e6dSJed Brown /*@C 53c2a741eeSJunchao Zhang PetscSignalSegvCheckPointerOrMpi - To be called from a signal handler for SIGSEGV. If the signal was received 5405035670SJunchao Zhang while executing PetscCheckPointer()/PetscCheckMpiXxxAwareness(), this function longjmps back there, otherwise returns 55c2a741eeSJunchao Zhang with no effect. This function is called automatically by PetscSignalHandlerDefault(). 56f8a67e6dSJed Brown 57f8a67e6dSJed Brown Not Collective 58f8a67e6dSJed Brown 59f8a67e6dSJed Brown Level: developer 60f8a67e6dSJed Brown 61f8a67e6dSJed Brown .seealso: PetscPushSignalHandler() 62f8a67e6dSJed Brown @*/ 6370a7d78aSStefano Zampini void PetscSignalSegvCheckPointerOrMpi(void) 6470a7d78aSStefano Zampini { 65f8a67e6dSJed Brown if (PetscSegvJumpBuf_set) longjmp(PetscSegvJumpBuf,1); 66f8a67e6dSJed Brown } 67d076d156SJed Brown 68d96cc911SJed Brown /*@C 69d96cc911SJed Brown PetscCheckPointer - Returns PETSC_TRUE if a pointer points to accessible data 70d96cc911SJed Brown 71d96cc911SJed Brown Not Collective 72d96cc911SJed Brown 73d96cc911SJed Brown Input Parameters: 74d96cc911SJed Brown + ptr - the pointer 75d96cc911SJed Brown - dtype - the type of data the pointer is suppose to point to 76d96cc911SJed Brown 77d96cc911SJed Brown Level: developer 78d96cc911SJed Brown 795789d1f5SJed Brown .seealso: PetscCheckPointerSetIntensity() 80d96cc911SJed Brown @*/ 81d96cc911SJed Brown PetscBool PetscCheckPointer(const void *ptr,PetscDataType dtype) 82d96cc911SJed Brown { 83d96cc911SJed Brown 84d96cc911SJed Brown if (PETSC_RUNNING_ON_VALGRIND) return PETSC_TRUE; 85d96cc911SJed Brown if (!ptr) return PETSC_FALSE; 8628559dc8SJed Brown if (petsc_checkpointer_intensity < 1) return PETSC_TRUE; 87d96cc911SJed Brown 88a2f94806SJed Brown /* Skip the verbose check if we are inside a hot function. */ 895c25fcd7SBarry Smith if (petscstack && petscstack->hotdepth > 0 && petsc_checkpointer_intensity < 2) return PETSC_TRUE; 90a2f94806SJed Brown 91718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_TRUE; 92d96cc911SJed Brown 93d96cc911SJed Brown if (setjmp(PetscSegvJumpBuf)) { 94d96cc911SJed Brown /* A segv was triggered in the code below hence we return with an error code */ 95718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_FALSE; 96d96cc911SJed Brown return PETSC_FALSE; 97d96cc911SJed Brown } else { 98d96cc911SJed Brown switch (dtype) { 99d96cc911SJed Brown case PETSC_INT:{ 100d96cc911SJed Brown PETSC_UNUSED PetscInt x = (PetscInt)*(volatile PetscInt*)ptr; 101d96cc911SJed Brown break; 102d96cc911SJed Brown } 103d96cc911SJed Brown #if defined(PETSC_USE_COMPLEX) 104d96cc911SJed Brown case PETSC_SCALAR:{ /* C++ is seriously dysfunctional with volatile std::complex. */ 10596d2aba5SSatish Balay #if defined(PETSC_USE_CXXCOMPLEX) 106d96cc911SJed Brown PetscReal xreal = ((volatile PetscReal*)ptr)[0],ximag = ((volatile PetscReal*)ptr)[1]; 107d96cc911SJed Brown PETSC_UNUSED volatile PetscScalar x = xreal + PETSC_i*ximag; 10896d2aba5SSatish Balay #else 10996d2aba5SSatish Balay PETSC_UNUSED PetscScalar x = *(volatile PetscScalar*)ptr; 11096d2aba5SSatish Balay #endif 111d96cc911SJed Brown break; 112d96cc911SJed Brown } 113d96cc911SJed Brown #endif 114d96cc911SJed Brown case PETSC_REAL:{ 115d96cc911SJed Brown PETSC_UNUSED PetscReal x = *(volatile PetscReal*)ptr; 116d96cc911SJed Brown break; 117d96cc911SJed Brown } 118d96cc911SJed Brown case PETSC_BOOL:{ 119d96cc911SJed Brown PETSC_UNUSED PetscBool x = *(volatile PetscBool*)ptr; 120d96cc911SJed Brown break; 121d96cc911SJed Brown } 122d96cc911SJed Brown case PETSC_ENUM:{ 123d96cc911SJed Brown PETSC_UNUSED PetscEnum x = *(volatile PetscEnum*)ptr; 124d96cc911SJed Brown break; 125d96cc911SJed Brown } 126d96cc911SJed Brown case PETSC_CHAR:{ 127f4e06bcbSJed Brown PETSC_UNUSED char x = *(volatile char*)ptr; 128d96cc911SJed Brown break; 129d96cc911SJed Brown } 130d96cc911SJed Brown case PETSC_OBJECT:{ 131d96cc911SJed Brown PETSC_UNUSED volatile PetscClassId classid = ((PetscObject)ptr)->classid; 132d96cc911SJed Brown break; 133d96cc911SJed Brown } 134d96cc911SJed Brown default:; 135d96cc911SJed Brown } 136d96cc911SJed Brown } 137718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_FALSE; 138d96cc911SJed Brown return PETSC_TRUE; 139d96cc911SJed Brown } 140c2a741eeSJunchao Zhang 14105035670SJunchao Zhang #define PetscMPICUPMAwarnessCheckFunction \ 14205035670SJunchao Zhang PetscBool PetscMPICUPMAwarenessCheck(void) \ 14305035670SJunchao Zhang { \ 14405035670SJunchao Zhang cupmError_t cerr=cupmSuccess; \ 14505035670SJunchao Zhang int ierr,hbuf[2]={1,0},*dbuf=NULL; \ 14605035670SJunchao Zhang PetscBool awareness=PETSC_FALSE; \ 14705035670SJunchao Zhang cerr = cupmMalloc((void**)&dbuf,sizeof(int)*2);if (cerr != cupmSuccess) return PETSC_FALSE; \ 14805035670SJunchao Zhang cerr = cupmMemcpy(dbuf,hbuf,sizeof(int)*2,cupmMemcpyHostToDevice);if (cerr != cupmSuccess) return PETSC_FALSE; \ 14905035670SJunchao Zhang PetscSegvJumpBuf_set = PETSC_TRUE; \ 15005035670SJunchao Zhang if (setjmp(PetscSegvJumpBuf)) { \ 15105035670SJunchao Zhang /* If a segv was triggered in the MPI_Allreduce below, it is very likely due to the MPI is not GPU-aware */ \ 15205035670SJunchao Zhang awareness = PETSC_FALSE; \ 15305035670SJunchao Zhang } else { \ 15405035670SJunchao Zhang ierr = MPI_Allreduce(dbuf,dbuf+1,1,MPI_INT,MPI_SUM,PETSC_COMM_SELF); \ 15505035670SJunchao Zhang if (!ierr) awareness = PETSC_TRUE; \ 15605035670SJunchao Zhang } \ 15705035670SJunchao Zhang PetscSegvJumpBuf_set = PETSC_FALSE; \ 15805035670SJunchao Zhang cerr = cupmFree(dbuf);if (cerr != cupmSuccess) return PETSC_FALSE; \ 15905035670SJunchao Zhang return awareness; \ 16005035670SJunchao Zhang } 16105035670SJunchao Zhang 162c2a741eeSJunchao Zhang #if defined(PETSC_HAVE_CUDA) 16305035670SJunchao Zhang #define cupmError_t cudaError_t 16405035670SJunchao Zhang #define cupmMalloc cudaMalloc 16505035670SJunchao Zhang #define cupmMemcpy cudaMemcpy 16605035670SJunchao Zhang #define cupmFree cudaFree 16705035670SJunchao Zhang #define cupmSuccess cudaSuccess 16805035670SJunchao Zhang #define cupmMemcpyHostToDevice cudaMemcpyHostToDevice 16905035670SJunchao Zhang #define PetscMPICUPMAwarenessCheck PetscMPICUDAAwarenessCheck 17005035670SJunchao Zhang PetscMPICUPMAwarnessCheckFunction 171c2a741eeSJunchao Zhang #endif 17205035670SJunchao Zhang 17305035670SJunchao Zhang #if defined(PETSC_HAVE_HIP) 17405035670SJunchao Zhang #define cupmError_t hipError_t 17505035670SJunchao Zhang #define cupmMalloc hipMalloc 17605035670SJunchao Zhang #define cupmMemcpy hipMemcpy 17705035670SJunchao Zhang #define cupmFree hipFree 17805035670SJunchao Zhang #define cupmSuccess hipSuccess 17905035670SJunchao Zhang #define cupmMemcpyHostToDevice hipMemcpyHostToDevice 18005035670SJunchao Zhang #define PetscMPICUPMAwarenessCheck PetscMPIHIPAwarenessCheck 18105035670SJunchao Zhang PetscMPICUPMAwarnessCheckFunction 18205035670SJunchao Zhang #endif 18305035670SJunchao Zhang 184d96cc911SJed Brown #else 18570a7d78aSStefano Zampini void PetscSignalSegvCheckPointerOrMpi(void) 18670a7d78aSStefano Zampini { 187f8a67e6dSJed Brown return; 188f8a67e6dSJed Brown } 189f8a67e6dSJed Brown 190d96cc911SJed Brown PetscBool PetscCheckPointer(const void *ptr,PETSC_UNUSED PetscDataType dtype) 191d96cc911SJed Brown { 192d96cc911SJed Brown if (!ptr) return PETSC_FALSE; 193d96cc911SJed Brown return PETSC_TRUE; 194d96cc911SJed Brown } 195c2a741eeSJunchao Zhang 19605035670SJunchao Zhang #if defined (PETSC_HAVE_CUDA) 19705035670SJunchao Zhang PetscBool PetscMPICUDAAwarenessCheck(void) 198c2a741eeSJunchao Zhang { 199c2a741eeSJunchao Zhang /* If no setjmp (rare), return true and let users code run (and segfault if they should) */ 200c2a741eeSJunchao Zhang return PETSC_TRUE; 201c2a741eeSJunchao Zhang } 202d96cc911SJed Brown #endif 20305035670SJunchao Zhang 20405035670SJunchao Zhang #if defined (PETSC_HAVE_HIP) 20505035670SJunchao Zhang PetscBool PetscMPIHIPAwarenessCheck(void) 20605035670SJunchao Zhang { 20705035670SJunchao Zhang /* If no setjmp (rare), return true and let users code run (and segfault if they should) */ 20805035670SJunchao Zhang return PETSC_TRUE; 20905035670SJunchao Zhang } 21005035670SJunchao Zhang #endif 21105035670SJunchao Zhang 21205035670SJunchao Zhang #endif 213