1af0996ceSBarry Smith #include <petsc/private/petscimpl.h> 2022afb99SBarry Smith #include <petscvalgrind.h> 3*05035670SJunchao Zhang 4c2a741eeSJunchao Zhang #if defined(PETSC_HAVE_CUDA) 5c2a741eeSJunchao Zhang #include <cuda_runtime.h> 6*05035670SJunchao Zhang #endif 7*05035670SJunchao Zhang 8*05035670SJunchao Zhang #if defined(PETSC_HAVE_HIP) 9*05035670SJunchao Zhang #include <hip/hip_runtime.h> 10c2a741eeSJunchao Zhang #endif 11d96cc911SJed Brown 1228559dc8SJed Brown static PetscInt petsc_checkpointer_intensity = 1; 1328559dc8SJed Brown 1428559dc8SJed Brown /*@ 1528559dc8SJed Brown PetscCheckPointerSetIntensity - An intense pointer check registers a signal handler and attempts to dereference to 1628559dc8SJed Brown confirm whether the address is valid. An intensity of 0 never uses signal handlers, 1 uses them when not in a "hot" 1728559dc8SJed Brown function, and intensity of 2 always uses a signal handler. 1828559dc8SJed Brown 1928559dc8SJed Brown Not Collective 2028559dc8SJed Brown 2128559dc8SJed Brown Input Arguments: 2228559dc8SJed Brown . intensity - how much to check pointers for validity 2328559dc8SJed Brown 24c2f74817SBarry Smith Options Database: 255789d1f5SJed Brown . -check_pointer_intensity - intensity (0, 1, or 2) 26c2f74817SBarry Smith 2728559dc8SJed Brown Level: advanced 2828559dc8SJed Brown 295789d1f5SJed Brown .seealso: PetscCheckPointer(), PetscFunctionBeginHot() 3028559dc8SJed Brown @*/ 3128559dc8SJed Brown PetscErrorCode PetscCheckPointerSetIntensity(PetscInt intensity) 3228559dc8SJed Brown { 3328559dc8SJed Brown 3428559dc8SJed Brown PetscFunctionBegin; 3528559dc8SJed Brown switch (intensity) { 3628559dc8SJed Brown case 0: 3728559dc8SJed Brown case 1: 3828559dc8SJed Brown case 2: 3928559dc8SJed Brown petsc_checkpointer_intensity = intensity; 4028559dc8SJed Brown break; 4128559dc8SJed Brown default: SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Intensity %D not in 0,1,2",intensity); 4228559dc8SJed Brown } 4328559dc8SJed Brown PetscFunctionReturn(0); 4428559dc8SJed Brown } 4528559dc8SJed Brown 46d96cc911SJed Brown /* ---------------------------------------------------------------------------------------*/ 47718fc407SJed Brown 48718fc407SJed Brown #if defined(PETSC_HAVE_SETJMP_H) 49d96cc911SJed Brown #include <setjmp.h> 50f8a67e6dSJed Brown static jmp_buf PetscSegvJumpBuf; 51f8a67e6dSJed Brown static PetscBool PetscSegvJumpBuf_set; 52f8a67e6dSJed Brown 53f8a67e6dSJed Brown /*@C 54c2a741eeSJunchao Zhang PetscSignalSegvCheckPointerOrMpi - To be called from a signal handler for SIGSEGV. If the signal was received 55*05035670SJunchao Zhang while executing PetscCheckPointer()/PetscCheckMpiXxxAwareness(), this function longjmps back there, otherwise returns 56c2a741eeSJunchao Zhang with no effect. This function is called automatically by PetscSignalHandlerDefault(). 57f8a67e6dSJed Brown 58f8a67e6dSJed Brown Not Collective 59f8a67e6dSJed Brown 60f8a67e6dSJed Brown Level: developer 61f8a67e6dSJed Brown 62f8a67e6dSJed Brown .seealso: PetscPushSignalHandler() 63f8a67e6dSJed Brown @*/ 64c2a741eeSJunchao Zhang void PetscSignalSegvCheckPointerOrMpi(void) { 65f8a67e6dSJed Brown if (PetscSegvJumpBuf_set) longjmp(PetscSegvJumpBuf,1); 66f8a67e6dSJed Brown } 67d076d156SJed Brown 68d96cc911SJed Brown /*@C 69d96cc911SJed Brown PetscCheckPointer - Returns PETSC_TRUE if a pointer points to accessible data 70d96cc911SJed Brown 71d96cc911SJed Brown Not Collective 72d96cc911SJed Brown 73d96cc911SJed Brown Input Parameters: 74d96cc911SJed Brown + ptr - the pointer 75d96cc911SJed Brown - dtype - the type of data the pointer is suppose to point to 76d96cc911SJed Brown 77d96cc911SJed Brown Level: developer 78d96cc911SJed Brown 795789d1f5SJed Brown .seealso: PetscCheckPointerSetIntensity() 80d96cc911SJed Brown @*/ 81d96cc911SJed Brown PetscBool PetscCheckPointer(const void *ptr,PetscDataType dtype) 82d96cc911SJed Brown { 83d96cc911SJed Brown 84d96cc911SJed Brown if (PETSC_RUNNING_ON_VALGRIND) return PETSC_TRUE; 85d96cc911SJed Brown if (!ptr) return PETSC_FALSE; 8628559dc8SJed Brown if (petsc_checkpointer_intensity < 1) return PETSC_TRUE; 87d96cc911SJed Brown 88a2f94806SJed Brown /* Skip the verbose check if we are inside a hot function. */ 895c25fcd7SBarry Smith if (petscstack && petscstack->hotdepth > 0 && petsc_checkpointer_intensity < 2) return PETSC_TRUE; 90a2f94806SJed Brown 91718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_TRUE; 92d96cc911SJed Brown 93d96cc911SJed Brown if (setjmp(PetscSegvJumpBuf)) { 94d96cc911SJed Brown /* A segv was triggered in the code below hence we return with an error code */ 95718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_FALSE; 96d96cc911SJed Brown return PETSC_FALSE; 97d96cc911SJed Brown } else { 98d96cc911SJed Brown switch (dtype) { 99d96cc911SJed Brown case PETSC_INT:{ 100d96cc911SJed Brown PETSC_UNUSED PetscInt x = (PetscInt)*(volatile PetscInt*)ptr; 101d96cc911SJed Brown break; 102d96cc911SJed Brown } 103d96cc911SJed Brown #if defined(PETSC_USE_COMPLEX) 104d96cc911SJed Brown case PETSC_SCALAR:{ /* C++ is seriously dysfunctional with volatile std::complex. */ 10596d2aba5SSatish Balay #if defined(PETSC_USE_CXXCOMPLEX) 106d96cc911SJed Brown PetscReal xreal = ((volatile PetscReal*)ptr)[0],ximag = ((volatile PetscReal*)ptr)[1]; 107d96cc911SJed Brown PETSC_UNUSED volatile PetscScalar x = xreal + PETSC_i*ximag; 10896d2aba5SSatish Balay #else 10996d2aba5SSatish Balay PETSC_UNUSED PetscScalar x = *(volatile PetscScalar*)ptr; 11096d2aba5SSatish Balay #endif 111d96cc911SJed Brown break; 112d96cc911SJed Brown } 113d96cc911SJed Brown #endif 114d96cc911SJed Brown case PETSC_REAL:{ 115d96cc911SJed Brown PETSC_UNUSED PetscReal x = *(volatile PetscReal*)ptr; 116d96cc911SJed Brown break; 117d96cc911SJed Brown } 118d96cc911SJed Brown case PETSC_BOOL:{ 119d96cc911SJed Brown PETSC_UNUSED PetscBool x = *(volatile PetscBool*)ptr; 120d96cc911SJed Brown break; 121d96cc911SJed Brown } 122d96cc911SJed Brown case PETSC_ENUM:{ 123d96cc911SJed Brown PETSC_UNUSED PetscEnum x = *(volatile PetscEnum*)ptr; 124d96cc911SJed Brown break; 125d96cc911SJed Brown } 126d96cc911SJed Brown case PETSC_CHAR:{ 127f4e06bcbSJed Brown PETSC_UNUSED char x = *(volatile char*)ptr; 128d96cc911SJed Brown break; 129d96cc911SJed Brown } 130d96cc911SJed Brown case PETSC_OBJECT:{ 131d96cc911SJed Brown PETSC_UNUSED volatile PetscClassId classid = ((PetscObject)ptr)->classid; 132d96cc911SJed Brown break; 133d96cc911SJed Brown } 134d96cc911SJed Brown default:; 135d96cc911SJed Brown } 136d96cc911SJed Brown } 137718fc407SJed Brown PetscSegvJumpBuf_set = PETSC_FALSE; 138d96cc911SJed Brown return PETSC_TRUE; 139d96cc911SJed Brown } 140c2a741eeSJunchao Zhang 141*05035670SJunchao Zhang #define PetscMPICUPMAwarnessCheckFunction \ 142*05035670SJunchao Zhang PetscBool PetscMPICUPMAwarenessCheck(void) \ 143*05035670SJunchao Zhang { \ 144*05035670SJunchao Zhang cupmError_t cerr=cupmSuccess; \ 145*05035670SJunchao Zhang int ierr,hbuf[2]={1,0},*dbuf=NULL; \ 146*05035670SJunchao Zhang PetscBool awareness=PETSC_FALSE; \ 147*05035670SJunchao Zhang cerr = cupmMalloc((void**)&dbuf,sizeof(int)*2);if (cerr != cupmSuccess) return PETSC_FALSE; \ 148*05035670SJunchao Zhang cerr = cupmMemcpy(dbuf,hbuf,sizeof(int)*2,cupmMemcpyHostToDevice);if (cerr != cupmSuccess) return PETSC_FALSE; \ 149*05035670SJunchao Zhang PetscSegvJumpBuf_set = PETSC_TRUE; \ 150*05035670SJunchao Zhang if (setjmp(PetscSegvJumpBuf)) { \ 151*05035670SJunchao Zhang /* If a segv was triggered in the MPI_Allreduce below, it is very likely due to the MPI is not GPU-aware */ \ 152*05035670SJunchao Zhang awareness = PETSC_FALSE; \ 153*05035670SJunchao Zhang } else { \ 154*05035670SJunchao Zhang ierr = MPI_Allreduce(dbuf,dbuf+1,1,MPI_INT,MPI_SUM,PETSC_COMM_SELF); \ 155*05035670SJunchao Zhang if (!ierr) awareness = PETSC_TRUE; \ 156*05035670SJunchao Zhang } \ 157*05035670SJunchao Zhang PetscSegvJumpBuf_set = PETSC_FALSE; \ 158*05035670SJunchao Zhang cerr = cupmFree(dbuf);if (cerr != cupmSuccess) return PETSC_FALSE; \ 159*05035670SJunchao Zhang return awareness; \ 160*05035670SJunchao Zhang } 161*05035670SJunchao Zhang 162c2a741eeSJunchao Zhang #if defined(PETSC_HAVE_CUDA) 163*05035670SJunchao Zhang #define cupmError_t cudaError_t 164*05035670SJunchao Zhang #define cupmMalloc cudaMalloc 165*05035670SJunchao Zhang #define cupmMemcpy cudaMemcpy 166*05035670SJunchao Zhang #define cupmFree cudaFree 167*05035670SJunchao Zhang #define cupmSuccess cudaSuccess 168*05035670SJunchao Zhang #define cupmMemcpyHostToDevice cudaMemcpyHostToDevice 169*05035670SJunchao Zhang #define PetscMPICUPMAwarenessCheck PetscMPICUDAAwarenessCheck 170*05035670SJunchao Zhang PetscMPICUPMAwarnessCheckFunction 171c2a741eeSJunchao Zhang #endif 172*05035670SJunchao Zhang 173*05035670SJunchao Zhang #if defined(PETSC_HAVE_HIP) 174*05035670SJunchao Zhang #define cupmError_t hipError_t 175*05035670SJunchao Zhang #define cupmMalloc hipMalloc 176*05035670SJunchao Zhang #define cupmMemcpy hipMemcpy 177*05035670SJunchao Zhang #define cupmFree hipFree 178*05035670SJunchao Zhang #define cupmSuccess hipSuccess 179*05035670SJunchao Zhang #define cupmMemcpyHostToDevice hipMemcpyHostToDevice 180*05035670SJunchao Zhang #define PetscMPICUPMAwarenessCheck PetscMPIHIPAwarenessCheck 181*05035670SJunchao Zhang PetscMPICUPMAwarnessCheckFunction 182*05035670SJunchao Zhang #endif 183*05035670SJunchao Zhang 184d96cc911SJed Brown #else 185c2a741eeSJunchao Zhang void PetscSignalSegvCheckPointerOrMpi(void) { 186f8a67e6dSJed Brown return; 187f8a67e6dSJed Brown } 188f8a67e6dSJed Brown 189d96cc911SJed Brown PetscBool PetscCheckPointer(const void *ptr,PETSC_UNUSED PetscDataType dtype) 190d96cc911SJed Brown { 191d96cc911SJed Brown if (!ptr) return PETSC_FALSE; 192d96cc911SJed Brown return PETSC_TRUE; 193d96cc911SJed Brown } 194c2a741eeSJunchao Zhang 195*05035670SJunchao Zhang #if defined (PETSC_HAVE_CUDA) 196*05035670SJunchao Zhang PetscBool PetscMPICUDAAwarenessCheck(void) 197c2a741eeSJunchao Zhang { 198c2a741eeSJunchao Zhang /* If no setjmp (rare), return true and let users code run (and segfault if they should) */ 199c2a741eeSJunchao Zhang return PETSC_TRUE; 200c2a741eeSJunchao Zhang } 201d96cc911SJed Brown #endif 202*05035670SJunchao Zhang 203*05035670SJunchao Zhang #if defined (PETSC_HAVE_HIP) 204*05035670SJunchao Zhang PetscBool PetscMPIHIPAwarenessCheck(void) 205*05035670SJunchao Zhang { 206*05035670SJunchao Zhang /* If no setjmp (rare), return true and let users code run (and segfault if they should) */ 207*05035670SJunchao Zhang return PETSC_TRUE; 208*05035670SJunchao Zhang } 209*05035670SJunchao Zhang #endif 210*05035670SJunchao Zhang 211*05035670SJunchao Zhang #endif 212