1af0996ceSBarry Smith #include <petsc/private/petscimpl.h> 2022afb99SBarry Smith #include <petscvalgrind.h> 305035670SJunchao Zhang 4c2a741eeSJunchao Zhang #if defined(PETSC_HAVE_CUDA) 5c2a741eeSJunchao Zhang #include <cuda_runtime.h> 605035670SJunchao Zhang #endif 705035670SJunchao Zhang 805035670SJunchao Zhang #if defined(PETSC_HAVE_HIP) 905035670SJunchao Zhang #include <hip/hip_runtime.h> 10c2a741eeSJunchao Zhang #endif 11d96cc911SJed Brown 1228559dc8SJed Brown static PetscInt petsc_checkpointer_intensity = 1; 1328559dc8SJed Brown 1428559dc8SJed Brown /*@ 1528559dc8SJed Brown PetscCheckPointerSetIntensity - An intense pointer check registers a signal handler and attempts to dereference to 1628559dc8SJed Brown confirm whether the address is valid. An intensity of 0 never uses signal handlers, 1 uses them when not in a "hot" 1728559dc8SJed Brown function, and intensity of 2 always uses a signal handler. 1828559dc8SJed Brown 1928559dc8SJed Brown Not Collective 2028559dc8SJed Brown 2128559dc8SJed Brown Input Arguments: 2228559dc8SJed Brown . intensity - how much to check pointers for validity 2328559dc8SJed Brown 24c2f74817SBarry Smith Options Database: 255789d1f5SJed Brown . -check_pointer_intensity - intensity (0, 1, or 2) 26c2f74817SBarry Smith 2728559dc8SJed Brown Level: advanced 2828559dc8SJed Brown 295789d1f5SJed Brown .seealso: PetscCheckPointer(), PetscFunctionBeginHot() 3028559dc8SJed Brown @*/ 3128559dc8SJed Brown PetscErrorCode PetscCheckPointerSetIntensity(PetscInt intensity) 3228559dc8SJed Brown { 3328559dc8SJed Brown 3428559dc8SJed Brown PetscFunctionBegin; 3528559dc8SJed Brown switch (intensity) { 3628559dc8SJed Brown case 0: 3728559dc8SJed Brown case 1: 3828559dc8SJed Brown case 2: 3928559dc8SJed Brown petsc_checkpointer_intensity = intensity; 4028559dc8SJed Brown break; 4128559dc8SJed Brown default: SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Intensity %D not in 0,1,2",intensity); 4228559dc8SJed Brown } 4328559dc8SJed Brown PetscFunctionReturn(0); 4428559dc8SJed Brown } 4528559dc8SJed Brown 46d96cc911SJed Brown /* ---------------------------------------------------------------------------------------*/ 47718fc407SJed Brown 48718fc407SJed Brown #if defined(PETSC_HAVE_SETJMP_H) 49d96cc911SJed Brown #include <setjmp.h> 50f8a67e6dSJed Brown static jmp_buf PetscSegvJumpBuf; 51f8a67e6dSJed Brown static PetscBool PetscSegvJumpBuf_set; 52f8a67e6dSJed Brown 53f8a67e6dSJed Brown /*@C 54c2a741eeSJunchao Zhang PetscSignalSegvCheckPointerOrMpi - To be called from a signal handler for SIGSEGV. If the signal was received 5505035670SJunchao Zhang while executing PetscCheckPointer()/PetscCheckMpiXxxAwareness(), this function longjmps back there, otherwise returns 56c2a741eeSJunchao Zhang with no effect. This function is called automatically by PetscSignalHandlerDefault(). 57f8a67e6dSJed Brown 58f8a67e6dSJed Brown Not Collective 59f8a67e6dSJed Brown 60f8a67e6dSJed Brown Level: developer 61f8a67e6dSJed Brown 62f8a67e6dSJed Brown .seealso: PetscPushSignalHandler() 63f8a67e6dSJed Brown @*/ 64*70a7d78aSStefano Zampini void PetscSignalSegvCheckPointerOrMpi(void) 65*70a7d78aSStefano Zampini { 66f8a67e6dSJed Brown if (PetscSegvJumpBuf_set) longjmp(PetscSegvJumpBuf,1); 67f8a67e6dSJed Brown } 68d076d156SJed Brown 69d96cc911SJed Brown /*@C 70d96cc911SJed Brown PetscCheckPointer - Returns PETSC_TRUE if a pointer points to accessible data 71d96cc911SJed Brown 72d96cc911SJed Brown Not Collective 73d96cc911SJed Brown 74d96cc911SJed Brown Input Parameters: 75d96cc911SJed Brown + ptr - the pointer 76d96cc911SJed Brown - dtype - the type of data the pointer is suppose to point to 77d96cc911SJed Brown 78d96cc911SJed Brown Level: developer 79d96cc911SJed Brown 805789d1f5SJed Brown .seealso: PetscCheckPointerSetIntensity() 81d96cc911SJed Brown @*/ 82d96cc911SJed Brown PetscBool PetscCheckPointer(const void *ptr,PetscDataType dtype) 83d96cc911SJed Brown { 84d96cc911SJed Brown 85d96cc911SJed Brown if (PETSC_RUNNING_ON_VALGRIND) return PETSC_TRUE; 86d96cc911SJed Brown if (!ptr) return PETSC_FALSE; 8728559dc8SJed Brown if (petsc_checkpointer_intensity < 1) return PETSC_TRUE; 88d96cc911SJed Brown 89a2f94806SJed Brown /* Skip the verbose check if we are inside a hot function. */ 905c25fcd7SBarry Smith if (petscstack && petscstack->hotdepth > 0 && petsc_checkpointer_intensity < 2) return PETSC_TRUE; 91a2f94806SJed Brown 92718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_TRUE; 93d96cc911SJed Brown 94d96cc911SJed Brown if (setjmp(PetscSegvJumpBuf)) { 95d96cc911SJed Brown /* A segv was triggered in the code below hence we return with an error code */ 96718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_FALSE; 97d96cc911SJed Brown return PETSC_FALSE; 98d96cc911SJed Brown } else { 99d96cc911SJed Brown switch (dtype) { 100d96cc911SJed Brown case PETSC_INT:{ 101d96cc911SJed Brown PETSC_UNUSED PetscInt x = (PetscInt)*(volatile PetscInt*)ptr; 102d96cc911SJed Brown break; 103d96cc911SJed Brown } 104d96cc911SJed Brown #if defined(PETSC_USE_COMPLEX) 105d96cc911SJed Brown case PETSC_SCALAR:{ /* C++ is seriously dysfunctional with volatile std::complex. */ 10696d2aba5SSatish Balay #if defined(PETSC_USE_CXXCOMPLEX) 107d96cc911SJed Brown PetscReal xreal = ((volatile PetscReal*)ptr)[0],ximag = ((volatile PetscReal*)ptr)[1]; 108d96cc911SJed Brown PETSC_UNUSED volatile PetscScalar x = xreal + PETSC_i*ximag; 10996d2aba5SSatish Balay #else 11096d2aba5SSatish Balay PETSC_UNUSED PetscScalar x = *(volatile PetscScalar*)ptr; 11196d2aba5SSatish Balay #endif 112d96cc911SJed Brown break; 113d96cc911SJed Brown } 114d96cc911SJed Brown #endif 115d96cc911SJed Brown case PETSC_REAL:{ 116d96cc911SJed Brown PETSC_UNUSED PetscReal x = *(volatile PetscReal*)ptr; 117d96cc911SJed Brown break; 118d96cc911SJed Brown } 119d96cc911SJed Brown case PETSC_BOOL:{ 120d96cc911SJed Brown PETSC_UNUSED PetscBool x = *(volatile PetscBool*)ptr; 121d96cc911SJed Brown break; 122d96cc911SJed Brown } 123d96cc911SJed Brown case PETSC_ENUM:{ 124d96cc911SJed Brown PETSC_UNUSED PetscEnum x = *(volatile PetscEnum*)ptr; 125d96cc911SJed Brown break; 126d96cc911SJed Brown } 127d96cc911SJed Brown case PETSC_CHAR:{ 128f4e06bcbSJed Brown PETSC_UNUSED char x = *(volatile char*)ptr; 129d96cc911SJed Brown break; 130d96cc911SJed Brown } 131d96cc911SJed Brown case PETSC_OBJECT:{ 132d96cc911SJed Brown PETSC_UNUSED volatile PetscClassId classid = ((PetscObject)ptr)->classid; 133d96cc911SJed Brown break; 134d96cc911SJed Brown } 135d96cc911SJed Brown default:; 136d96cc911SJed Brown } 137d96cc911SJed Brown } 138718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_FALSE; 139d96cc911SJed Brown return PETSC_TRUE; 140d96cc911SJed Brown } 141c2a741eeSJunchao Zhang 14205035670SJunchao Zhang #define PetscMPICUPMAwarnessCheckFunction \ 14305035670SJunchao Zhang PetscBool PetscMPICUPMAwarenessCheck(void) \ 14405035670SJunchao Zhang { \ 14505035670SJunchao Zhang cupmError_t cerr=cupmSuccess; \ 14605035670SJunchao Zhang int ierr,hbuf[2]={1,0},*dbuf=NULL; \ 14705035670SJunchao Zhang PetscBool awareness=PETSC_FALSE; \ 14805035670SJunchao Zhang cerr = cupmMalloc((void**)&dbuf,sizeof(int)*2);if (cerr != cupmSuccess) return PETSC_FALSE; \ 14905035670SJunchao Zhang cerr = cupmMemcpy(dbuf,hbuf,sizeof(int)*2,cupmMemcpyHostToDevice);if (cerr != cupmSuccess) return PETSC_FALSE; \ 15005035670SJunchao Zhang PetscSegvJumpBuf_set = PETSC_TRUE; \ 15105035670SJunchao Zhang if (setjmp(PetscSegvJumpBuf)) { \ 15205035670SJunchao Zhang /* If a segv was triggered in the MPI_Allreduce below, it is very likely due to the MPI is not GPU-aware */ \ 15305035670SJunchao Zhang awareness = PETSC_FALSE; \ 15405035670SJunchao Zhang } else { \ 15505035670SJunchao Zhang ierr = MPI_Allreduce(dbuf,dbuf+1,1,MPI_INT,MPI_SUM,PETSC_COMM_SELF); \ 15605035670SJunchao Zhang if (!ierr) awareness = PETSC_TRUE; \ 15705035670SJunchao Zhang } \ 15805035670SJunchao Zhang PetscSegvJumpBuf_set = PETSC_FALSE; \ 15905035670SJunchao Zhang cerr = cupmFree(dbuf);if (cerr != cupmSuccess) return PETSC_FALSE; \ 16005035670SJunchao Zhang return awareness; \ 16105035670SJunchao Zhang } 16205035670SJunchao Zhang 163c2a741eeSJunchao Zhang #if defined(PETSC_HAVE_CUDA) 16405035670SJunchao Zhang #define cupmError_t cudaError_t 16505035670SJunchao Zhang #define cupmMalloc cudaMalloc 16605035670SJunchao Zhang #define cupmMemcpy cudaMemcpy 16705035670SJunchao Zhang #define cupmFree cudaFree 16805035670SJunchao Zhang #define cupmSuccess cudaSuccess 16905035670SJunchao Zhang #define cupmMemcpyHostToDevice cudaMemcpyHostToDevice 17005035670SJunchao Zhang #define PetscMPICUPMAwarenessCheck PetscMPICUDAAwarenessCheck 17105035670SJunchao Zhang PetscMPICUPMAwarnessCheckFunction 172c2a741eeSJunchao Zhang #endif 17305035670SJunchao Zhang 17405035670SJunchao Zhang #if defined(PETSC_HAVE_HIP) 17505035670SJunchao Zhang #define cupmError_t hipError_t 17605035670SJunchao Zhang #define cupmMalloc hipMalloc 17705035670SJunchao Zhang #define cupmMemcpy hipMemcpy 17805035670SJunchao Zhang #define cupmFree hipFree 17905035670SJunchao Zhang #define cupmSuccess hipSuccess 18005035670SJunchao Zhang #define cupmMemcpyHostToDevice hipMemcpyHostToDevice 18105035670SJunchao Zhang #define PetscMPICUPMAwarenessCheck PetscMPIHIPAwarenessCheck 18205035670SJunchao Zhang PetscMPICUPMAwarnessCheckFunction 18305035670SJunchao Zhang #endif 18405035670SJunchao Zhang 185d96cc911SJed Brown #else 186*70a7d78aSStefano Zampini void PetscSignalSegvCheckPointerOrMpi(void) 187*70a7d78aSStefano Zampini { 188f8a67e6dSJed Brown return; 189f8a67e6dSJed Brown } 190f8a67e6dSJed Brown 191d96cc911SJed Brown PetscBool PetscCheckPointer(const void *ptr,PETSC_UNUSED PetscDataType dtype) 192d96cc911SJed Brown { 193d96cc911SJed Brown if (!ptr) return PETSC_FALSE; 194d96cc911SJed Brown return PETSC_TRUE; 195d96cc911SJed Brown } 196c2a741eeSJunchao Zhang 19705035670SJunchao Zhang #if defined (PETSC_HAVE_CUDA) 19805035670SJunchao Zhang PetscBool PetscMPICUDAAwarenessCheck(void) 199c2a741eeSJunchao Zhang { 200c2a741eeSJunchao Zhang /* If no setjmp (rare), return true and let users code run (and segfault if they should) */ 201c2a741eeSJunchao Zhang return PETSC_TRUE; 202c2a741eeSJunchao Zhang } 203d96cc911SJed Brown #endif 20405035670SJunchao Zhang 20505035670SJunchao Zhang #if defined (PETSC_HAVE_HIP) 20605035670SJunchao Zhang PetscBool PetscMPIHIPAwarenessCheck(void) 20705035670SJunchao Zhang { 20805035670SJunchao Zhang /* If no setjmp (rare), return true and let users code run (and segfault if they should) */ 20905035670SJunchao Zhang return PETSC_TRUE; 21005035670SJunchao Zhang } 21105035670SJunchao Zhang #endif 21205035670SJunchao Zhang 21305035670SJunchao Zhang #endif 214