15c6c1daeSBarry Smith 25c6c1daeSBarry Smith /* 35c6c1daeSBarry Smith PETSc code to log object creation and destruction and PETSc events. 45c6c1daeSBarry Smith 55c6c1daeSBarry Smith This provides the public API used by the rest of PETSc and by users. 65c6c1daeSBarry Smith 75c6c1daeSBarry Smith These routines use a private API that is not used elsewhere in PETSc and is not 85c6c1daeSBarry Smith accessible to users. The private API is defined in logimpl.h and the utils directory. 95c6c1daeSBarry Smith 105c6c1daeSBarry Smith */ 11af0996ceSBarry Smith #include <petsc/private/logimpl.h> /*I "petscsys.h" I*/ 125c6c1daeSBarry Smith #include <petsctime.h> 13665c2dedSJed Brown #include <petscviewer.h> 148fe3844cSJunchao Zhang #include <petscdevice.h> 158fe3844cSJunchao Zhang #include <petsc/private/deviceimpl.h> 16a0c7f9aaSSamuel Khuvis #if defined(PETSC_HAVE_TAU_PERFSTUBS) 17a0c7f9aaSSamuel Khuvis #include <../src/sys/perfstubs/timer.h> 18a0c7f9aaSSamuel Khuvis #endif 195c6c1daeSBarry Smith 205c6c1daeSBarry Smith PetscLogEvent PETSC_LARGEST_EVENT = PETSC_EVENT; 215c6c1daeSBarry Smith 225c6c1daeSBarry Smith #if defined(PETSC_USE_LOG) 235c6c1daeSBarry Smith #include <petscmachineinfo.h> 245c6c1daeSBarry Smith #include <petscconfiginfo.h> 255c6c1daeSBarry Smith 26c708d6e3SStefano Zampini #if defined(PETSC_HAVE_THREADSAFETY) 27c708d6e3SStefano Zampini 28c708d6e3SStefano Zampini PetscInt petsc_log_gid = -1; /* Global threadId counter */ 29c708d6e3SStefano Zampini PETSC_TLS PetscInt petsc_log_tid = -1; /* Local threadId */ 30c708d6e3SStefano Zampini 31c708d6e3SStefano Zampini /* shared variables */ 32c708d6e3SStefano Zampini PetscSpinlock PetscLogSpinLock; 33c708d6e3SStefano Zampini PetscHMapEvent eventInfoMap_th = NULL; 34c708d6e3SStefano Zampini 35c708d6e3SStefano Zampini #endif 36c708d6e3SStefano Zampini 375c6c1daeSBarry Smith /* used in the MPI_XXX() count macros in petsclog.h */ 385c6c1daeSBarry Smith 395c6c1daeSBarry Smith /* Action and object logging variables */ 
400298fd71SBarry Smith Action *petsc_actions = NULL; 410298fd71SBarry Smith Object *petsc_objects = NULL; 425c6c1daeSBarry Smith PetscBool petsc_logActions = PETSC_FALSE; 435c6c1daeSBarry Smith PetscBool petsc_logObjects = PETSC_FALSE; 445c6c1daeSBarry Smith int petsc_numActions = 0, petsc_maxActions = 100; 455c6c1daeSBarry Smith int petsc_numObjects = 0, petsc_maxObjects = 100; 465c6c1daeSBarry Smith int petsc_numObjectsDestroyed = 0; 475c6c1daeSBarry Smith 485c6c1daeSBarry Smith /* Global counters */ 495c6c1daeSBarry Smith PetscLogDouble petsc_BaseTime = 0.0; 505c6c1daeSBarry Smith PetscLogDouble petsc_TotalFlops = 0.0; /* The number of flops */ 515c6c1daeSBarry Smith PetscLogDouble petsc_send_ct = 0.0; /* The number of sends */ 525c6c1daeSBarry Smith PetscLogDouble petsc_recv_ct = 0.0; /* The number of receives */ 535c6c1daeSBarry Smith PetscLogDouble petsc_send_len = 0.0; /* The total length of all sent messages */ 545c6c1daeSBarry Smith PetscLogDouble petsc_recv_len = 0.0; /* The total length of all received messages */ 555c6c1daeSBarry Smith PetscLogDouble petsc_isend_ct = 0.0; /* The number of immediate sends */ 565c6c1daeSBarry Smith PetscLogDouble petsc_irecv_ct = 0.0; /* The number of immediate receives */ 575c6c1daeSBarry Smith PetscLogDouble petsc_isend_len = 0.0; /* The total length of all immediate send messages */ 585c6c1daeSBarry Smith PetscLogDouble petsc_irecv_len = 0.0; /* The total length of all immediate receive messages */ 595c6c1daeSBarry Smith PetscLogDouble petsc_wait_ct = 0.0; /* The number of waits */ 605c6c1daeSBarry Smith PetscLogDouble petsc_wait_any_ct = 0.0; /* The number of anywaits */ 615c6c1daeSBarry Smith PetscLogDouble petsc_wait_all_ct = 0.0; /* The number of waitalls */ 625c6c1daeSBarry Smith PetscLogDouble petsc_sum_of_waits_ct = 0.0; /* The total number of waits */ 635c6c1daeSBarry Smith PetscLogDouble petsc_allreduce_ct = 0.0; /* The number of reductions */ 645c6c1daeSBarry Smith PetscLogDouble petsc_gather_ct = 0.0; /* The 
number of gathers and gathervs */ 655c6c1daeSBarry Smith PetscLogDouble petsc_scatter_ct = 0.0; /* The number of scatters and scattervs */ 66c708d6e3SStefano Zampini 67c708d6e3SStefano Zampini /* Thread Local storage */ 68c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_TotalFlops_th = 0.0; 69c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_send_ct_th = 0.0; 70c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_recv_ct_th = 0.0; 71c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_send_len_th = 0.0; 72c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_recv_len_th = 0.0; 73c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_isend_ct_th = 0.0; 74c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_irecv_ct_th = 0.0; 75c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_isend_len_th = 0.0; 76c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_irecv_len_th = 0.0; 77c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_wait_ct_th = 0.0; 78c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_wait_any_ct_th = 0.0; 79c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_wait_all_ct_th = 0.0; 80c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_sum_of_waits_ct_th = 0.0; 81c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_allreduce_ct_th = 0.0; 82c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_gather_ct_th = 0.0; 83c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_scatter_ct_th = 0.0; 84c708d6e3SStefano Zampini 8520c24465SJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 86bec0b493Shannah_mairs PetscLogDouble petsc_ctog_ct = 0.0; /* The total number of CPU to GPU copies */ 87bec0b493Shannah_mairs PetscLogDouble petsc_gtoc_ct = 0.0; /* The total number of GPU to CPU copies */ 88bec0b493Shannah_mairs PetscLogDouble petsc_ctog_sz = 0.0; /* The total size of CPU to GPU copies */ 89bec0b493Shannah_mairs PetscLogDouble petsc_gtoc_sz = 0.0; /* The total size of GPU to CPU copies */ 9045c4b7c1SBarry Smith 
PetscLogDouble petsc_ctog_ct_scalar = 0.0; /* The total number of CPU to GPU copies */ 9145c4b7c1SBarry Smith PetscLogDouble petsc_gtoc_ct_scalar = 0.0; /* The total number of GPU to CPU copies */ 9245c4b7c1SBarry Smith PetscLogDouble petsc_ctog_sz_scalar = 0.0; /* The total size of CPU to GPU copies */ 9345c4b7c1SBarry Smith PetscLogDouble petsc_gtoc_sz_scalar = 0.0; /* The total size of GPU to CPU copies */ 94958c4211Shannah_mairs PetscLogDouble petsc_gflops = 0.0; /* The flops done on a GPU */ 95958c4211Shannah_mairs PetscLogDouble petsc_gtime = 0.0; /* The time spent on a GPU */ 96c708d6e3SStefano Zampini 97c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_ctog_ct_th = 0.0; 98c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_gtoc_ct_th = 0.0; 99c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_ctog_sz_th = 0.0; 100c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_gtoc_sz_th = 0.0; 101c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_ctog_ct_scalar_th = 0.0; 102c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_gtoc_ct_scalar_th = 0.0; 103c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_ctog_sz_scalar_th = 0.0; 104c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_gtoc_sz_scalar_th = 0.0; 105c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_gflops_th = 0.0; 106c708d6e3SStefano Zampini PETSC_TLS PetscLogDouble petsc_gtime_th = 0.0; 107c708d6e3SStefano Zampini #endif 108c708d6e3SStefano Zampini 109c708d6e3SStefano Zampini #if defined(PETSC_HAVE_THREADSAFETY) 110c708d6e3SStefano Zampini PetscErrorCode PetscAddLogDouble(PetscLogDouble *tot, PetscLogDouble *tot_th, PetscLogDouble tmp) 111c708d6e3SStefano Zampini { 112c708d6e3SStefano Zampini *tot_th += tmp; 1133ba16761SJacob Faibussowitsch PetscCall(PetscSpinlockLock(&PetscLogSpinLock)); 114c708d6e3SStefano Zampini *tot += tmp; 1153ba16761SJacob Faibussowitsch PetscCall(PetscSpinlockUnlock(&PetscLogSpinLock)); 1163ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 
117c708d6e3SStefano Zampini } 118c708d6e3SStefano Zampini 119c708d6e3SStefano Zampini PetscErrorCode PetscAddLogDoubleCnt(PetscLogDouble *cnt, PetscLogDouble *tot, PetscLogDouble *cnt_th, PetscLogDouble *tot_th, PetscLogDouble tmp) 120c708d6e3SStefano Zampini { 121c708d6e3SStefano Zampini *cnt_th = *cnt_th + 1; 122c708d6e3SStefano Zampini *tot_th += tmp; 1233ba16761SJacob Faibussowitsch PetscCall(PetscSpinlockLock(&PetscLogSpinLock)); 124c708d6e3SStefano Zampini *tot += (PetscLogDouble)(tmp); 125c708d6e3SStefano Zampini *cnt += *cnt + 1; 1263ba16761SJacob Faibussowitsch PetscCall(PetscSpinlockUnlock(&PetscLogSpinLock)); 1273ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 128c708d6e3SStefano Zampini } 129c708d6e3SStefano Zampini 130c708d6e3SStefano Zampini PetscInt PetscLogGetTid(void) 131c708d6e3SStefano Zampini { 132c708d6e3SStefano Zampini if (petsc_log_tid < 0) { 1333ba16761SJacob Faibussowitsch PetscCall(PetscSpinlockLock(&PetscLogSpinLock)); 134c708d6e3SStefano Zampini petsc_log_tid = ++petsc_log_gid; 1353ba16761SJacob Faibussowitsch PetscCall(PetscSpinlockUnlock(&PetscLogSpinLock)); 136c708d6e3SStefano Zampini } 137c708d6e3SStefano Zampini return petsc_log_tid; 138c708d6e3SStefano Zampini } 139c708d6e3SStefano Zampini 140bec0b493Shannah_mairs #endif 1415c6c1daeSBarry Smith 1425c6c1daeSBarry Smith /* Logging functions */ 1430298fd71SBarry Smith PetscErrorCode (*PetscLogPHC)(PetscObject) = NULL; 1440298fd71SBarry Smith PetscErrorCode (*PetscLogPHD)(PetscObject) = NULL; 1450298fd71SBarry Smith PetscErrorCode (*PetscLogPLB)(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject) = NULL; 1460298fd71SBarry Smith PetscErrorCode (*PetscLogPLE)(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject) = NULL; 1475c6c1daeSBarry Smith 1485c6c1daeSBarry Smith /* Tracing event logging variables */ 1490298fd71SBarry Smith FILE *petsc_tracefile = NULL; 1505c6c1daeSBarry Smith int petsc_tracelevel = 0; 1515c6c1daeSBarry Smith const char 
*petsc_traceblanks = " "; 1525c6c1daeSBarry Smith char petsc_tracespace[128] = " "; 1535c6c1daeSBarry Smith PetscLogDouble petsc_tracetime = 0.0; 154896238b9SBarry Smith static PetscBool PetscLogInitializeCalled = PETSC_FALSE; 1555c6c1daeSBarry Smith 1567a101e5eSJacob Faibussowitsch static PetscIntStack current_log_event_stack = NULL; 1577a101e5eSJacob Faibussowitsch 158d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode PetscLogInitialize(void) 159d71ae5a4SJacob Faibussowitsch { 160fa2bb9feSLisandro Dalcin int stage; 161fa2bb9feSLisandro Dalcin PetscBool opt; 1625c6c1daeSBarry Smith 163fa2bb9feSLisandro Dalcin PetscFunctionBegin; 1643ba16761SJacob Faibussowitsch if (PetscLogInitializeCalled) PetscFunctionReturn(PETSC_SUCCESS); 165fa2bb9feSLisandro Dalcin PetscLogInitializeCalled = PETSC_TRUE; 1665c6c1daeSBarry Smith 1677a101e5eSJacob Faibussowitsch PetscCall(PetscIntStackCreate(¤t_log_event_stack)); 1689566063dSJacob Faibussowitsch PetscCall(PetscOptionsHasName(NULL, NULL, "-log_exclude_actions", &opt)); 169fa2bb9feSLisandro Dalcin if (opt) petsc_logActions = PETSC_FALSE; 1709566063dSJacob Faibussowitsch PetscCall(PetscOptionsHasName(NULL, NULL, "-log_exclude_objects", &opt)); 171fa2bb9feSLisandro Dalcin if (opt) petsc_logObjects = PETSC_FALSE; 17248a46eb9SPierre Jolivet if (petsc_logActions) PetscCall(PetscMalloc1(petsc_maxActions, &petsc_actions)); 17348a46eb9SPierre Jolivet if (petsc_logObjects) PetscCall(PetscMalloc1(petsc_maxObjects, &petsc_objects)); 174fa2bb9feSLisandro Dalcin PetscLogPHC = PetscLogObjCreateDefault; 175fa2bb9feSLisandro Dalcin PetscLogPHD = PetscLogObjDestroyDefault; 176fa2bb9feSLisandro Dalcin /* Setup default logging structures */ 1779566063dSJacob Faibussowitsch PetscCall(PetscStageLogCreate(&petsc_stageLog)); 1789566063dSJacob Faibussowitsch PetscCall(PetscStageLogRegister(petsc_stageLog, "Main Stage", &stage)); 1795c6c1daeSBarry Smith 180c708d6e3SStefano Zampini PetscCall(PetscSpinlockCreate(&PetscLogSpinLock)); 
181c708d6e3SStefano Zampini #if defined(PETSC_HAVE_THREADSAFETY) 182c708d6e3SStefano Zampini petsc_log_tid = 0; 183c708d6e3SStefano Zampini petsc_log_gid = 0; 184c708d6e3SStefano Zampini PetscCall(PetscHMapEventCreate(&eventInfoMap_th)); 185c708d6e3SStefano Zampini #endif 186c708d6e3SStefano Zampini 187fa2bb9feSLisandro Dalcin /* All processors sync here for more consistent logging */ 1889566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(PETSC_COMM_WORLD)); 1893ba16761SJacob Faibussowitsch PetscCall(PetscTime(&petsc_BaseTime)); 1909566063dSJacob Faibussowitsch PetscCall(PetscLogStagePush(stage)); 191a0c7f9aaSSamuel Khuvis #if defined(PETSC_HAVE_TAU_PERFSTUBS) 192a0c7f9aaSSamuel Khuvis PetscStackCallExternalVoid("ps_initialize_", ps_initialize_()); 193a0c7f9aaSSamuel Khuvis #endif 1943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 195fa2bb9feSLisandro Dalcin } 1965c6c1daeSBarry Smith 197d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode PetscLogFinalize(void) 198d71ae5a4SJacob Faibussowitsch { 1995c6c1daeSBarry Smith PetscStageLog stageLog; 2005c6c1daeSBarry Smith 2015c6c1daeSBarry Smith PetscFunctionBegin; 202c708d6e3SStefano Zampini #if defined(PETSC_HAVE_THREADSAFETY) 203c708d6e3SStefano Zampini if (eventInfoMap_th) { 204c708d6e3SStefano Zampini PetscEventPerfInfo **array; 205c708d6e3SStefano Zampini PetscInt n, off = 0; 206c708d6e3SStefano Zampini 207c708d6e3SStefano Zampini PetscCall(PetscHMapEventGetSize(eventInfoMap_th, &n)); 208c708d6e3SStefano Zampini PetscCall(PetscMalloc1(n, &array)); 209c708d6e3SStefano Zampini PetscCall(PetscHMapEventGetVals(eventInfoMap_th, &off, array)); 210c708d6e3SStefano Zampini for (PetscInt i = 0; i < n; i++) PetscCall(PetscFree(array[i])); 211c708d6e3SStefano Zampini PetscCall(PetscFree(array)); 212c708d6e3SStefano Zampini PetscCall(PetscHMapEventDestroy(&eventInfoMap_th)); 213c708d6e3SStefano Zampini } 214c708d6e3SStefano Zampini #endif 2159566063dSJacob Faibussowitsch 
PetscCall(PetscFree(petsc_actions)); 2169566063dSJacob Faibussowitsch PetscCall(PetscFree(petsc_objects)); 2179566063dSJacob Faibussowitsch PetscCall(PetscLogNestedEnd()); 2189566063dSJacob Faibussowitsch PetscCall(PetscLogSet(NULL, NULL)); 2195c6c1daeSBarry Smith 2205c6c1daeSBarry Smith /* Resetting phase */ 2219566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 2229566063dSJacob Faibussowitsch PetscCall(PetscStageLogDestroy(stageLog)); 2237a101e5eSJacob Faibussowitsch PetscCall(PetscIntStackDestroy(current_log_event_stack)); 2247a101e5eSJacob Faibussowitsch current_log_event_stack = NULL; 225a297a907SKarl Rupp 2265c6c1daeSBarry Smith petsc_TotalFlops = 0.0; 2275c6c1daeSBarry Smith petsc_numActions = 0; 2285c6c1daeSBarry Smith petsc_numObjects = 0; 2295c6c1daeSBarry Smith petsc_numObjectsDestroyed = 0; 2305c6c1daeSBarry Smith petsc_maxActions = 100; 2315c6c1daeSBarry Smith petsc_maxObjects = 100; 2320298fd71SBarry Smith petsc_actions = NULL; 2330298fd71SBarry Smith petsc_objects = NULL; 2345c6c1daeSBarry Smith petsc_logActions = PETSC_FALSE; 2355c6c1daeSBarry Smith petsc_logObjects = PETSC_FALSE; 2365c6c1daeSBarry Smith petsc_BaseTime = 0.0; 2375c6c1daeSBarry Smith petsc_TotalFlops = 0.0; 2385c6c1daeSBarry Smith petsc_send_ct = 0.0; 2395c6c1daeSBarry Smith petsc_recv_ct = 0.0; 2405c6c1daeSBarry Smith petsc_send_len = 0.0; 2415c6c1daeSBarry Smith petsc_recv_len = 0.0; 2425c6c1daeSBarry Smith petsc_isend_ct = 0.0; 2435c6c1daeSBarry Smith petsc_irecv_ct = 0.0; 2445c6c1daeSBarry Smith petsc_isend_len = 0.0; 2455c6c1daeSBarry Smith petsc_irecv_len = 0.0; 2465c6c1daeSBarry Smith petsc_wait_ct = 0.0; 2475c6c1daeSBarry Smith petsc_wait_any_ct = 0.0; 2485c6c1daeSBarry Smith petsc_wait_all_ct = 0.0; 2495c6c1daeSBarry Smith petsc_sum_of_waits_ct = 0.0; 2505c6c1daeSBarry Smith petsc_allreduce_ct = 0.0; 2515c6c1daeSBarry Smith petsc_gather_ct = 0.0; 2525c6c1daeSBarry Smith petsc_scatter_ct = 0.0; 253c708d6e3SStefano Zampini petsc_TotalFlops_th = 0.0; 
254c708d6e3SStefano Zampini petsc_send_ct_th = 0.0; 255c708d6e3SStefano Zampini petsc_recv_ct_th = 0.0; 256c708d6e3SStefano Zampini petsc_send_len_th = 0.0; 257c708d6e3SStefano Zampini petsc_recv_len_th = 0.0; 258c708d6e3SStefano Zampini petsc_isend_ct_th = 0.0; 259c708d6e3SStefano Zampini petsc_irecv_ct_th = 0.0; 260c708d6e3SStefano Zampini petsc_isend_len_th = 0.0; 261c708d6e3SStefano Zampini petsc_irecv_len_th = 0.0; 262c708d6e3SStefano Zampini petsc_wait_ct_th = 0.0; 263c708d6e3SStefano Zampini petsc_wait_any_ct_th = 0.0; 264c708d6e3SStefano Zampini petsc_wait_all_ct_th = 0.0; 265c708d6e3SStefano Zampini petsc_sum_of_waits_ct_th = 0.0; 266c708d6e3SStefano Zampini petsc_allreduce_ct_th = 0.0; 267c708d6e3SStefano Zampini petsc_gather_ct_th = 0.0; 268c708d6e3SStefano Zampini petsc_scatter_ct_th = 0.0; 269c708d6e3SStefano Zampini 270d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 271bec0b493Shannah_mairs petsc_ctog_ct = 0.0; 272bec0b493Shannah_mairs petsc_gtoc_ct = 0.0; 273bec0b493Shannah_mairs petsc_ctog_sz = 0.0; 274bec0b493Shannah_mairs petsc_gtoc_sz = 0.0; 275958c4211Shannah_mairs petsc_gflops = 0.0; 276958c4211Shannah_mairs petsc_gtime = 0.0; 277c708d6e3SStefano Zampini petsc_ctog_ct_th = 0.0; 278c708d6e3SStefano Zampini petsc_gtoc_ct_th = 0.0; 279c708d6e3SStefano Zampini petsc_ctog_sz_th = 0.0; 280c708d6e3SStefano Zampini petsc_gtoc_sz_th = 0.0; 281c708d6e3SStefano Zampini petsc_gflops_th = 0.0; 282c708d6e3SStefano Zampini petsc_gtime_th = 0.0; 283bec0b493Shannah_mairs #endif 284c708d6e3SStefano Zampini 2855c6c1daeSBarry Smith PETSC_LARGEST_EVENT = PETSC_EVENT; 2860298fd71SBarry Smith PetscLogPHC = NULL; 2870298fd71SBarry Smith PetscLogPHD = NULL; 2880298fd71SBarry Smith petsc_tracefile = NULL; 2895c6c1daeSBarry Smith petsc_tracelevel = 0; 2905c6c1daeSBarry Smith petsc_traceblanks = " "; 2919371c9d4SSatish Balay petsc_tracespace[0] = ' '; 2929371c9d4SSatish Balay petsc_tracespace[1] = 0; 2935c6c1daeSBarry Smith petsc_tracetime = 0.0; 2945c6c1daeSBarry 
Smith PETSC_LARGEST_CLASSID = PETSC_SMALLEST_CLASSID; 2955c6c1daeSBarry Smith PETSC_OBJECT_CLASSID = 0; 29602c9f0b5SLisandro Dalcin petsc_stageLog = NULL; 297896238b9SBarry Smith PetscLogInitializeCalled = PETSC_FALSE; 2983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2995c6c1daeSBarry Smith } 3005c6c1daeSBarry Smith 3015c6c1daeSBarry Smith /*@C 3025c6c1daeSBarry Smith PetscLogSet - Sets the logging functions called at the beginning and ending of every event. 3035c6c1daeSBarry Smith 3045c6c1daeSBarry Smith Not Collective 3055c6c1daeSBarry Smith 3065c6c1daeSBarry Smith Input Parameters: 3075c6c1daeSBarry Smith + b - The function called at beginning of event 3085c6c1daeSBarry Smith - e - The function called at end of event 3095c6c1daeSBarry Smith 3105c6c1daeSBarry Smith Level: developer 3115c6c1daeSBarry Smith 312aec76313SJacob Faibussowitsch Developer Notes: 313811af0c4SBarry Smith The default loggers are `PetscLogEventBeginDefault()` and `PetscLogEventEndDefault()`. 314811af0c4SBarry Smith 315d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDump()`, `PetscLogDefaultBegin()`, `PetscLogAllBegin()`, `PetscLogTraceBegin()`, `PetscLogEventBeginDefault()`, `PetscLogEventEndDefault()` 3165c6c1daeSBarry Smith @*/ 317d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogSet(PetscErrorCode (*b)(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject), PetscErrorCode (*e)(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject)) 318d71ae5a4SJacob Faibussowitsch { 3195c6c1daeSBarry Smith PetscFunctionBegin; 3205c6c1daeSBarry Smith PetscLogPLB = b; 3215c6c1daeSBarry Smith PetscLogPLE = e; 3223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3235c6c1daeSBarry Smith } 3245c6c1daeSBarry Smith 3255c6c1daeSBarry Smith /*@C 3264dd65854SConnor Ward PetscLogIsActive - Check if logging is currently in progress. 
3274dd65854SConnor Ward 3284dd65854SConnor Ward Not Collective 3294dd65854SConnor Ward 3304dd65854SConnor Ward Output Parameter: 331811af0c4SBarry Smith . isActive - `PETSC_TRUE` if logging is in progress, `PETSC_FALSE` otherwise 3324dd65854SConnor Ward 3334dd65854SConnor Ward Level: beginner 3344dd65854SConnor Ward 335d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDefaultBegin()`, `PetscLogAllBegin()`, `PetscLogSet()` 3364dd65854SConnor Ward @*/ 337d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogIsActive(PetscBool *isActive) 338d71ae5a4SJacob Faibussowitsch { 3394dd65854SConnor Ward PetscFunctionBegin; 3404dd65854SConnor Ward *isActive = (PetscLogPLB && PetscLogPLE) ? PETSC_TRUE : PETSC_FALSE; 3413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3424dd65854SConnor Ward } 3434dd65854SConnor Ward 3444dd65854SConnor Ward /*@C 345811af0c4SBarry Smith PetscLogDefaultBegin - Turns on logging of objects and events using the default logging functions `PetscLogEventBeginDefault()` and `PetscLogEventEndDefault()`. This logs flop 3465c6c1daeSBarry Smith rates and object creation and should not slow programs down too much. 3475c6c1daeSBarry Smith This routine may be called more than once. 3485c6c1daeSBarry Smith 349811af0c4SBarry Smith Logically Collective over `PETSC_COMM_WORLD` 3505c6c1daeSBarry Smith 351811af0c4SBarry Smith Options Database Key: 352a2553e36SBarry Smith . -log_view [viewertype:filename:viewerformat] - Prints summary of flop and timing information to the 353a2553e36SBarry Smith screen (for code configured with --with-log=1 (which is the default)) 3545c6c1daeSBarry Smith 35510450e9eSJacob Faibussowitsch Example Usage: 3565c6c1daeSBarry Smith .vb 3575c6c1daeSBarry Smith PetscInitialize(...); 358bb1d7374SBarry Smith PetscLogDefaultBegin(); 3595c6c1daeSBarry Smith ... code ... 
3605c6c1daeSBarry Smith PetscLogView(viewer); or PetscLogDump(); 3615c6c1daeSBarry Smith PetscFinalize(); 3625c6c1daeSBarry Smith .ve 3635c6c1daeSBarry Smith 364d1f92df0SBarry Smith Level: advanced 365d1f92df0SBarry Smith 366811af0c4SBarry Smith Note: 367811af0c4SBarry Smith `PetscLogView()` or `PetscLogDump()` actually cause the printing of 3685c6c1daeSBarry Smith the logging information. 3695c6c1daeSBarry Smith 370d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDump()`, `PetscLogAllBegin()`, `PetscLogView()`, `PetscLogTraceBegin()` 3715c6c1daeSBarry Smith @*/ 372d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogDefaultBegin(void) 373d71ae5a4SJacob Faibussowitsch { 3745c6c1daeSBarry Smith PetscFunctionBegin; 3759566063dSJacob Faibussowitsch PetscCall(PetscLogSet(PetscLogEventBeginDefault, PetscLogEventEndDefault)); 3763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3775c6c1daeSBarry Smith } 3785c6c1daeSBarry Smith 3795c6c1daeSBarry Smith /*@C 3805c6c1daeSBarry Smith PetscLogAllBegin - Turns on extensive logging of objects and events. Logs 3815c6c1daeSBarry Smith all events. This creates large log files and slows the program down. 3825c6c1daeSBarry Smith 383811af0c4SBarry Smith Logically Collective on `PETSC_COMM_WORLD` 3845c6c1daeSBarry Smith 385811af0c4SBarry Smith Options Database Key: 386a2553e36SBarry Smith . -log_all - Prints extensive log information 3875c6c1daeSBarry Smith 38810450e9eSJacob Faibussowitsch Example Usage: 3895c6c1daeSBarry Smith .vb 3905c6c1daeSBarry Smith PetscInitialize(...); 3915c6c1daeSBarry Smith PetscLogAllBegin(); 3925c6c1daeSBarry Smith ... code ... 
3935c6c1daeSBarry Smith PetscLogDump(filename); 3945c6c1daeSBarry Smith PetscFinalize(); 3955c6c1daeSBarry Smith .ve 3965c6c1daeSBarry Smith 397d1f92df0SBarry Smith Level: advanced 398d1f92df0SBarry Smith 399811af0c4SBarry Smith Note: 400811af0c4SBarry Smith A related routine is `PetscLogDefaultBegin()` (with the options key -log_view), which is 4015c6c1daeSBarry Smith intended for production runs since it logs only flop rates and object 4025c6c1daeSBarry Smith creation (and shouldn't significantly slow the programs). 4035c6c1daeSBarry Smith 404d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDump()`, `PetscLogDefaultBegin()`, `PetscLogTraceBegin()` 4055c6c1daeSBarry Smith @*/ 406d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogAllBegin(void) 407d71ae5a4SJacob Faibussowitsch { 4085c6c1daeSBarry Smith PetscFunctionBegin; 4099566063dSJacob Faibussowitsch PetscCall(PetscLogSet(PetscLogEventBeginComplete, PetscLogEventEndComplete)); 4103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4115c6c1daeSBarry Smith } 4125c6c1daeSBarry Smith 413956f8c0dSBarry Smith /*@C 4145c6c1daeSBarry Smith PetscLogTraceBegin - Activates trace logging. Every time a PETSc event 4155c6c1daeSBarry Smith begins or ends, the event name is printed. 4165c6c1daeSBarry Smith 417811af0c4SBarry Smith Logically Collective on `PETSC_COMM_WORLD` 4185c6c1daeSBarry Smith 4195c6c1daeSBarry Smith Input Parameter: 4205c6c1daeSBarry Smith . file - The file to print trace in (e.g. stdout) 4215c6c1daeSBarry Smith 4225c6c1daeSBarry Smith Options Database Key: 423811af0c4SBarry Smith . -log_trace [filename] - Activates `PetscLogTraceBegin()` 4245c6c1daeSBarry Smith 425d1f92df0SBarry Smith Level: intermediate 426d1f92df0SBarry Smith 4275c6c1daeSBarry Smith Notes: 428811af0c4SBarry Smith `PetscLogTraceBegin()` prints the processor number, the execution time (sec), 4295c6c1daeSBarry Smith then "Event begin:" or "Event end:" followed by the event name. 
4305c6c1daeSBarry Smith 431811af0c4SBarry Smith `PetscLogTraceBegin()` allows tracing of all PETSc calls, which is useful 4325c6c1daeSBarry Smith to determine where a program is hanging without running in the 4335c6c1daeSBarry Smith debugger. Can be used in conjunction with the -info option. 4345c6c1daeSBarry Smith 435d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDump()`, `PetscLogAllBegin()`, `PetscLogView()`, `PetscLogDefaultBegin()` 4365c6c1daeSBarry Smith @*/ 437d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogTraceBegin(FILE *file) 438d71ae5a4SJacob Faibussowitsch { 4395c6c1daeSBarry Smith PetscFunctionBegin; 4405c6c1daeSBarry Smith petsc_tracefile = file; 441a297a907SKarl Rupp 4429566063dSJacob Faibussowitsch PetscCall(PetscLogSet(PetscLogEventBeginTrace, PetscLogEventEndTrace)); 4433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4445c6c1daeSBarry Smith } 4455c6c1daeSBarry Smith 4465c6c1daeSBarry Smith /*@ 4475c6c1daeSBarry Smith PetscLogActions - Determines whether actions are logged for the graphical viewer. 4485c6c1daeSBarry Smith 4495c6c1daeSBarry Smith Not Collective 4505c6c1daeSBarry Smith 4515c6c1daeSBarry Smith Input Parameter: 452811af0c4SBarry Smith . flag - `PETSC_TRUE` if actions are to be logged 453811af0c4SBarry Smith 454811af0c4SBarry Smith Options Database Key: 455811af0c4SBarry Smith . -log_exclude_actions - Turns off actions logging 4565c6c1daeSBarry Smith 4575c6c1daeSBarry Smith Level: intermediate 4585c6c1daeSBarry Smith 459811af0c4SBarry Smith Note: 460811af0c4SBarry Smith Logging of actions continues to consume more memory as the program 4615c6c1daeSBarry Smith runs. Long running programs should consider turning this feature off. 
462aec76313SJacob Faibussowitsch 463d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStagePush()`, `PetscLogStagePop()` 4645c6c1daeSBarry Smith @*/ 465d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogActions(PetscBool flag) 466d71ae5a4SJacob Faibussowitsch { 4675c6c1daeSBarry Smith PetscFunctionBegin; 4685c6c1daeSBarry Smith petsc_logActions = flag; 4693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4705c6c1daeSBarry Smith } 4715c6c1daeSBarry Smith 4725c6c1daeSBarry Smith /*@ 4735c6c1daeSBarry Smith PetscLogObjects - Determines whether objects are logged for the graphical viewer. 4745c6c1daeSBarry Smith 4755c6c1daeSBarry Smith Not Collective 4765c6c1daeSBarry Smith 4775c6c1daeSBarry Smith Input Parameter: 478811af0c4SBarry Smith . flag - `PETSC_TRUE` if objects are to be logged 479811af0c4SBarry Smith 480811af0c4SBarry Smith Options Database Key: 481811af0c4SBarry Smith . -log_exclude_objects - Turns off objects logging 4825c6c1daeSBarry Smith 4835c6c1daeSBarry Smith Level: intermediate 4845c6c1daeSBarry Smith 485811af0c4SBarry Smith Note: 486811af0c4SBarry Smith Logging of objects continues to consume more memory as the program 4875c6c1daeSBarry Smith runs. Long running programs should consider turning this feature off. 
4885c6c1daeSBarry Smith 489d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStagePush()`, `PetscLogStagePop()` 4905c6c1daeSBarry Smith @*/ 491d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogObjects(PetscBool flag) 492d71ae5a4SJacob Faibussowitsch { 4935c6c1daeSBarry Smith PetscFunctionBegin; 4945c6c1daeSBarry Smith petsc_logObjects = flag; 4953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4965c6c1daeSBarry Smith } 4975c6c1daeSBarry Smith 4985c6c1daeSBarry Smith /*------------------------------------------------ Stage Functions --------------------------------------------------*/ 4995c6c1daeSBarry Smith /*@C 50074c0405dSRichard Tran Mills PetscLogStageRegister - Attaches a character string name to a logging stage. 5015c6c1daeSBarry Smith 5025c6c1daeSBarry Smith Not Collective 5035c6c1daeSBarry Smith 5045c6c1daeSBarry Smith Input Parameter: 5055c6c1daeSBarry Smith . sname - The name to associate with that stage 5065c6c1daeSBarry Smith 5075c6c1daeSBarry Smith Output Parameter: 5085c6c1daeSBarry Smith . 
stage - The stage number 5095c6c1daeSBarry Smith 5105c6c1daeSBarry Smith Level: intermediate 5115c6c1daeSBarry Smith 512d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStagePush()`, `PetscLogStagePop()` 5135c6c1daeSBarry Smith @*/ 514d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogStageRegister(const char sname[], PetscLogStage *stage) 515d71ae5a4SJacob Faibussowitsch { 5165c6c1daeSBarry Smith PetscStageLog stageLog; 5175c6c1daeSBarry Smith PetscLogEvent event; 5185c6c1daeSBarry Smith 5195c6c1daeSBarry Smith PetscFunctionBegin; 5209566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 5219566063dSJacob Faibussowitsch PetscCall(PetscStageLogRegister(stageLog, sname, stage)); 5225c6c1daeSBarry Smith /* Copy events already changed in the main stage, this sucks */ 5239566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogEnsureSize(stageLog->stageInfo[*stage].eventLog, stageLog->eventLog->numEvents)); 52448a46eb9SPierre Jolivet for (event = 0; event < stageLog->eventLog->numEvents; event++) PetscCall(PetscEventPerfInfoCopy(&stageLog->stageInfo[0].eventLog->eventInfo[event], &stageLog->stageInfo[*stage].eventLog->eventInfo[event])); 5259566063dSJacob Faibussowitsch PetscCall(PetscClassPerfLogEnsureSize(stageLog->stageInfo[*stage].classLog, stageLog->classLog->numClasses)); 526a0c7f9aaSSamuel Khuvis #if defined(PETSC_HAVE_TAU_PERFSTUBS) 527a0c7f9aaSSamuel Khuvis if (perfstubs_initialized == PERFSTUBS_SUCCESS) PetscStackCallExternalVoid("ps_timer_create_", stageLog->stageInfo[*stage].timer = ps_timer_create_(sname)); 528a0c7f9aaSSamuel Khuvis #endif 5293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5305c6c1daeSBarry Smith } 5315c6c1daeSBarry Smith 5325c6c1daeSBarry Smith /*@C 533811af0c4SBarry Smith PetscLogStagePush - This function pushes a stage on the logging stack. 
Events started and stopped until `PetscLogStagePop()` will be associated with the stage 5345c6c1daeSBarry Smith 5355c6c1daeSBarry Smith Not Collective 5365c6c1daeSBarry Smith 5375c6c1daeSBarry Smith Input Parameter: 5385c6c1daeSBarry Smith . stage - The stage on which to log 5395c6c1daeSBarry Smith 54010450e9eSJacob Faibussowitsch Example Usage: 541811af0c4SBarry Smith If the option -log_view is used to run the program containing the 5425c6c1daeSBarry Smith following code, then 2 sets of summary data will be printed during 5435c6c1daeSBarry Smith PetscFinalize(). 5445c6c1daeSBarry Smith .vb 5455c6c1daeSBarry Smith PetscInitialize(int *argc,char ***args,0,0); 5465c6c1daeSBarry Smith [stage 0 of code] 5475c6c1daeSBarry Smith PetscLogStagePush(1); 5485c6c1daeSBarry Smith [stage 1 of code] 5495c6c1daeSBarry Smith PetscLogStagePop(); 5505c6c1daeSBarry Smith PetscBarrier(...); 5515c6c1daeSBarry Smith [more stage 0 of code] 5525c6c1daeSBarry Smith PetscFinalize(); 5535c6c1daeSBarry Smith .ve 5545c6c1daeSBarry Smith 555d1f92df0SBarry Smith Level: intermediate 556d1f92df0SBarry Smith 557811af0c4SBarry Smith Note: 558811af0c4SBarry Smith Use `PetscLogStageRegister()` to register a stage. 
5595c6c1daeSBarry Smith 560d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStagePop()`, `PetscLogStageRegister()`, `PetscBarrier()` 5615c6c1daeSBarry Smith @*/ 562d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogStagePush(PetscLogStage stage) 563d71ae5a4SJacob Faibussowitsch { 5645c6c1daeSBarry Smith PetscStageLog stageLog; 5655c6c1daeSBarry Smith 5665c6c1daeSBarry Smith PetscFunctionBegin; 5679566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 5689566063dSJacob Faibussowitsch PetscCall(PetscStageLogPush(stageLog, stage)); 569a0c7f9aaSSamuel Khuvis #if defined(PETSC_HAVE_TAU_PERFSTUBS) 570a0c7f9aaSSamuel Khuvis if (perfstubs_initialized == PERFSTUBS_SUCCESS && stageLog->stageInfo[stage].timer != NULL) PetscStackCallExternalVoid("ps_timer_start_", ps_timer_start_(stageLog->stageInfo[stage].timer)); 571a0c7f9aaSSamuel Khuvis #endif 5723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5735c6c1daeSBarry Smith } 5745c6c1daeSBarry Smith 5755c6c1daeSBarry Smith /*@C 576811af0c4SBarry Smith PetscLogStagePop - This function pops a stage from the logging stack that was pushed with `PetscLogStagePush()` 5775c6c1daeSBarry Smith 5785c6c1daeSBarry Smith Not Collective 5795c6c1daeSBarry Smith 58010450e9eSJacob Faibussowitsch Example Usage: 581811af0c4SBarry Smith If the option -log_view is used to run the program containing the 5825c6c1daeSBarry Smith following code, then 2 sets of summary data will be printed during 5835c6c1daeSBarry Smith PetscFinalize(). 
5845c6c1daeSBarry Smith .vb 5855c6c1daeSBarry Smith PetscInitialize(int *argc,char ***args,0,0); 5865c6c1daeSBarry Smith [stage 0 of code] 5875c6c1daeSBarry Smith PetscLogStagePush(1); 5885c6c1daeSBarry Smith [stage 1 of code] 5895c6c1daeSBarry Smith PetscLogStagePop(); 5905c6c1daeSBarry Smith PetscBarrier(...); 5915c6c1daeSBarry Smith [more stage 0 of code] 5925c6c1daeSBarry Smith PetscFinalize(); 5935c6c1daeSBarry Smith .ve 5945c6c1daeSBarry Smith 5955c6c1daeSBarry Smith Level: intermediate 5965c6c1daeSBarry Smith 597d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStagePush()`, `PetscLogStageRegister()`, `PetscBarrier()` 5985c6c1daeSBarry Smith @*/ 599d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogStagePop(void) 600d71ae5a4SJacob Faibussowitsch { 6015c6c1daeSBarry Smith PetscStageLog stageLog; 6025c6c1daeSBarry Smith 6035c6c1daeSBarry Smith PetscFunctionBegin; 6049566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 605a0c7f9aaSSamuel Khuvis #if defined(PETSC_HAVE_TAU_PERFSTUBS) 606a0c7f9aaSSamuel Khuvis if (perfstubs_initialized == PERFSTUBS_SUCCESS && stageLog->stageInfo[stageLog->curStage].timer != NULL) PetscStackCallExternalVoid("ps_timer_stop_", ps_timer_stop_(stageLog->stageInfo[stageLog->curStage].timer)); 607a0c7f9aaSSamuel Khuvis #endif 6089566063dSJacob Faibussowitsch PetscCall(PetscStageLogPop(stageLog)); 6093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6105c6c1daeSBarry Smith } 6115c6c1daeSBarry Smith 6125c6c1daeSBarry Smith /*@ 613811af0c4SBarry Smith PetscLogStageSetActive - Sets if a stage is used for `PetscLogEventBegin()` and `PetscLogEventEnd()`. 
6145c6c1daeSBarry Smith 6155c6c1daeSBarry Smith Not Collective 6165c6c1daeSBarry Smith 6175c6c1daeSBarry Smith Input Parameters: 6185c6c1daeSBarry Smith + stage - The stage 619811af0c4SBarry Smith - isActive - The activity flag, `PETSC_TRUE` for logging, else `PETSC_FALSE` (defaults to `PETSC_TRUE`) 6205c6c1daeSBarry Smith 6215c6c1daeSBarry Smith Level: intermediate 6225c6c1daeSBarry Smith 623811af0c4SBarry Smith Note: 624811af0c4SBarry Smith If this is set to `PETSC_FALSE` the logging acts as if the stage did not exist 625811af0c4SBarry Smith 626d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStageRegister()`, `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadBegin()`, `PetscPreLoadEnd()`, `PetscPreLoadStage()` 6275c6c1daeSBarry Smith @*/ 628d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogStageSetActive(PetscLogStage stage, PetscBool isActive) 629d71ae5a4SJacob Faibussowitsch { 6305c6c1daeSBarry Smith PetscStageLog stageLog; 6315c6c1daeSBarry Smith 6325c6c1daeSBarry Smith PetscFunctionBegin; 6339566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 6349566063dSJacob Faibussowitsch PetscCall(PetscStageLogSetActive(stageLog, stage, isActive)); 6353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6365c6c1daeSBarry Smith } 6375c6c1daeSBarry Smith 6385c6c1daeSBarry Smith /*@ 639811af0c4SBarry Smith PetscLogStageGetActive - Checks if a stage is used for `PetscLogEventBegin()` and `PetscLogEventEnd()`. 6405c6c1daeSBarry Smith 6415c6c1daeSBarry Smith Not Collective 6425c6c1daeSBarry Smith 6435c6c1daeSBarry Smith Input Parameter: 6445c6c1daeSBarry Smith . stage - The stage 6455c6c1daeSBarry Smith 6465c6c1daeSBarry Smith Output Parameter: 647811af0c4SBarry Smith . 
isActive - The activity flag, `PETSC_TRUE` for logging, else `PETSC_FALSE` (defaults to `PETSC_TRUE`) 6485c6c1daeSBarry Smith 6495c6c1daeSBarry Smith Level: intermediate 6505c6c1daeSBarry Smith 651d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStageRegister()`, `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadBegin()`, `PetscPreLoadEnd()`, `PetscPreLoadStage()` 6525c6c1daeSBarry Smith @*/ 653d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogStageGetActive(PetscLogStage stage, PetscBool *isActive) 654d71ae5a4SJacob Faibussowitsch { 6555c6c1daeSBarry Smith PetscStageLog stageLog; 6565c6c1daeSBarry Smith 6575c6c1daeSBarry Smith PetscFunctionBegin; 6589566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 6599566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetActive(stageLog, stage, isActive)); 6603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6615c6c1daeSBarry Smith } 6625c6c1daeSBarry Smith 6635c6c1daeSBarry Smith /*@ 664811af0c4SBarry Smith PetscLogStageSetVisible - Determines stage visibility in `PetscLogView()` 6655c6c1daeSBarry Smith 6665c6c1daeSBarry Smith Not Collective 6675c6c1daeSBarry Smith 6685c6c1daeSBarry Smith Input Parameters: 6695c6c1daeSBarry Smith + stage - The stage 670811af0c4SBarry Smith - isVisible - The visibility flag, `PETSC_TRUE` to print, else `PETSC_FALSE` (defaults to `PETSC_TRUE`) 6715c6c1daeSBarry Smith 6725c6c1daeSBarry Smith Level: intermediate 6735c6c1daeSBarry Smith 674aec76313SJacob Faibussowitsch Developer Notes: 675811af0c4SBarry Smith What does visible mean, needs to be documented. 
676811af0c4SBarry Smith 677d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStageRegister()`, `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscLogView()` 6785c6c1daeSBarry Smith @*/ 679d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogStageSetVisible(PetscLogStage stage, PetscBool isVisible) 680d71ae5a4SJacob Faibussowitsch { 6815c6c1daeSBarry Smith PetscStageLog stageLog; 6825c6c1daeSBarry Smith 6835c6c1daeSBarry Smith PetscFunctionBegin; 6849566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 6859566063dSJacob Faibussowitsch PetscCall(PetscStageLogSetVisible(stageLog, stage, isVisible)); 6863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6875c6c1daeSBarry Smith } 6885c6c1daeSBarry Smith 6895c6c1daeSBarry Smith /*@ 690811af0c4SBarry Smith PetscLogStageGetVisible - Returns stage visibility in `PetscLogView()` 6915c6c1daeSBarry Smith 6925c6c1daeSBarry Smith Not Collective 6935c6c1daeSBarry Smith 6945c6c1daeSBarry Smith Input Parameter: 6955c6c1daeSBarry Smith . stage - The stage 6965c6c1daeSBarry Smith 6975c6c1daeSBarry Smith Output Parameter: 698811af0c4SBarry Smith . 
isVisible - The visibility flag, `PETSC_TRUE` to print, else `PETSC_FALSE` (defaults to `PETSC_TRUE`) 6995c6c1daeSBarry Smith 7005c6c1daeSBarry Smith Level: intermediate 7015c6c1daeSBarry Smith 702d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStageRegister()`, `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscLogView()` 7035c6c1daeSBarry Smith @*/ 704d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogStageGetVisible(PetscLogStage stage, PetscBool *isVisible) 705d71ae5a4SJacob Faibussowitsch { 7065c6c1daeSBarry Smith PetscStageLog stageLog; 7075c6c1daeSBarry Smith 7085c6c1daeSBarry Smith PetscFunctionBegin; 7099566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 7109566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetVisible(stageLog, stage, isVisible)); 7113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7125c6c1daeSBarry Smith } 7135c6c1daeSBarry Smith 7145c6c1daeSBarry Smith /*@C 7155c6c1daeSBarry Smith PetscLogStageGetId - Returns the stage id when given the stage name. 7165c6c1daeSBarry Smith 7175c6c1daeSBarry Smith Not Collective 7185c6c1daeSBarry Smith 7195c6c1daeSBarry Smith Input Parameter: 7205c6c1daeSBarry Smith . name - The stage name 7215c6c1daeSBarry Smith 7225c6c1daeSBarry Smith Output Parameter: 7235a4a3fabSBarry Smith . 
stage - The stage, , or -1 if no stage with that name exists 7245c6c1daeSBarry Smith 7255c6c1daeSBarry Smith Level: intermediate 7265c6c1daeSBarry Smith 727d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStageRegister()`, `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscPreLoadBegin()`, `PetscPreLoadEnd()`, `PetscPreLoadStage()` 7285c6c1daeSBarry Smith @*/ 729d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogStageGetId(const char name[], PetscLogStage *stage) 730d71ae5a4SJacob Faibussowitsch { 7315c6c1daeSBarry Smith PetscStageLog stageLog; 7325c6c1daeSBarry Smith 7335c6c1daeSBarry Smith PetscFunctionBegin; 7349566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 7359566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetStage(stageLog, name, stage)); 7363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7375c6c1daeSBarry Smith } 7385c6c1daeSBarry Smith 7395c6c1daeSBarry Smith /*------------------------------------------------ Event Functions --------------------------------------------------*/ 7407a101e5eSJacob Faibussowitsch 7415c6c1daeSBarry Smith /*@C 742811af0c4SBarry Smith PetscLogEventRegister - Registers an event name for logging operations 7435c6c1daeSBarry Smith 7445c6c1daeSBarry Smith Not Collective 7455c6c1daeSBarry Smith 746d8d19677SJose E. Roman Input Parameters: 7475c6c1daeSBarry Smith + name - The name associated with the event 7485c6c1daeSBarry Smith - classid - The classid associated to the class for this event, obtain either with 749811af0c4SBarry Smith `PetscClassIdRegister()` or use a predefined one such as `KSP_CLASSID`, `SNES_CLASSID`, the predefined ones 7505c6c1daeSBarry Smith are only available in C code 7515c6c1daeSBarry Smith 7525c6c1daeSBarry Smith Output Parameter: 753811af0c4SBarry Smith . event - The event id for use with `PetscLogEventBegin()` and `PetscLogEventEnd()`. 
7545c6c1daeSBarry Smith 75510450e9eSJacob Faibussowitsch Example Usage: 7565c6c1daeSBarry Smith .vb 7575c6c1daeSBarry Smith PetscLogEvent USER_EVENT; 7585c6c1daeSBarry Smith PetscClassId classid; 7595c6c1daeSBarry Smith PetscLogDouble user_event_flops; 7605c6c1daeSBarry Smith PetscClassIdRegister("class name",&classid); 7615c6c1daeSBarry Smith PetscLogEventRegister("User event name",classid,&USER_EVENT); 7625c6c1daeSBarry Smith PetscLogEventBegin(USER_EVENT,0,0,0,0); 7635c6c1daeSBarry Smith [code segment to monitor] 7645c6c1daeSBarry Smith PetscLogFlops(user_event_flops); 7655c6c1daeSBarry Smith PetscLogEventEnd(USER_EVENT,0,0,0,0); 7665c6c1daeSBarry Smith .ve 7675c6c1daeSBarry Smith 768d1f92df0SBarry Smith Level: intermediate 769d1f92df0SBarry Smith 7705c6c1daeSBarry Smith Notes: 7715c6c1daeSBarry Smith PETSc automatically logs library events if the code has been 772a2553e36SBarry Smith configured with --with-log (which is the default) and 773811af0c4SBarry Smith -log_view or -log_all is specified. `PetscLogEventRegister()` is 7745c6c1daeSBarry Smith intended for logging user events to supplement this PETSc 7755c6c1daeSBarry Smith information. 7765c6c1daeSBarry Smith 777495fc317SBarry Smith PETSc can gather data for use with the utilities Jumpshot 7785c6c1daeSBarry Smith (part of the MPICH distribution). If PETSc has been compiled 7795c6c1daeSBarry Smith with flag -DPETSC_HAVE_MPE (MPE is an additional utility within 7805c6c1daeSBarry Smith MPICH), the user can employ another command line option, -log_mpe, 7815c6c1daeSBarry Smith to create a logfile, "mpe.log", which can be visualized 782495fc317SBarry Smith Jumpshot. 7835c6c1daeSBarry Smith 7845c6c1daeSBarry Smith The classid is associated with each event so that classes of events 7855c6c1daeSBarry Smith can be disabled simultaneously, such as all matrix events. 
The user 786811af0c4SBarry Smith can either use an existing classid, such as `MAT_CLASSID`, or create 7875c6c1daeSBarry Smith their own as shown in the example. 7885c6c1daeSBarry Smith 789c5deb1d5SJed Brown If an existing event with the same name exists, its event handle is 790c5deb1d5SJed Brown returned instead of creating a new event. 791c5deb1d5SJed Brown 792d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogStageRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscLogFlops()`, 793db781477SPatrick Sanan `PetscLogEventActivate()`, `PetscLogEventDeactivate()`, `PetscClassIdRegister()` 7945c6c1daeSBarry Smith @*/ 795d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventRegister(const char name[], PetscClassId classid, PetscLogEvent *event) 796d71ae5a4SJacob Faibussowitsch { 7975c6c1daeSBarry Smith PetscStageLog stageLog; 7985c6c1daeSBarry Smith int stage; 7995c6c1daeSBarry Smith 8005c6c1daeSBarry Smith PetscFunctionBegin; 8015c6c1daeSBarry Smith *event = PETSC_DECIDE; 8029566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 8039566063dSJacob Faibussowitsch PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, name, event)); 8043ba16761SJacob Faibussowitsch if (*event > 0) PetscFunctionReturn(PETSC_SUCCESS); 8059566063dSJacob Faibussowitsch PetscCall(PetscEventRegLogRegister(stageLog->eventLog, name, classid, event)); 8065c6c1daeSBarry Smith for (stage = 0; stage < stageLog->numStages; stage++) { 8079566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogEnsureSize(stageLog->stageInfo[stage].eventLog, stageLog->eventLog->numEvents)); 8089566063dSJacob Faibussowitsch PetscCall(PetscClassPerfLogEnsureSize(stageLog->stageInfo[stage].classLog, stageLog->classLog->numClasses)); 8095c6c1daeSBarry Smith } 8103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8115c6c1daeSBarry Smith } 8125c6c1daeSBarry Smith 8135c6c1daeSBarry Smith /*@ 814217044c2SLisandro Dalcin PetscLogEventSetCollective - Indicates that a 
particular event is collective. 815217044c2SLisandro Dalcin 816217044c2SLisandro Dalcin Not Collective 817217044c2SLisandro Dalcin 818d8d19677SJose E. Roman Input Parameters: 819217044c2SLisandro Dalcin + event - The event id 820d5b43468SJose E. Roman - collective - Boolean flag indicating whether a particular event is collective 821217044c2SLisandro Dalcin 822d1f92df0SBarry Smith Level: developer 823d1f92df0SBarry Smith 824811af0c4SBarry Smith Notes: 825811af0c4SBarry Smith New events returned from `PetscLogEventRegister()` are collective by default. 826811af0c4SBarry Smith 827811af0c4SBarry Smith Collective events are handled specially if the -log_sync is used. In that case the logging saves information about 828811af0c4SBarry Smith two parts of the event; the time for all the MPI ranks to synchronize and then the time for the actual computation/communication 829811af0c4SBarry Smith to be performed. This option is useful to debug imbalance within the computations or communications 830217044c2SLisandro Dalcin 831d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscLogEventRegister()` 832217044c2SLisandro Dalcin @*/ 833d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventSetCollective(PetscLogEvent event, PetscBool collective) 834d71ae5a4SJacob Faibussowitsch { 835217044c2SLisandro Dalcin PetscStageLog stageLog; 836217044c2SLisandro Dalcin PetscEventRegLog eventRegLog; 837217044c2SLisandro Dalcin 838217044c2SLisandro Dalcin PetscFunctionBegin; 8399566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 8409566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetEventRegLog(stageLog, &eventRegLog)); 841cc73adaaSBarry Smith PetscCheck(event >= 0 && event <= eventRegLog->numEvents, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid event id"); 842217044c2SLisandro Dalcin eventRegLog->eventInfo[event].collective = collective; 8433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 
844217044c2SLisandro Dalcin } 845217044c2SLisandro Dalcin 846217044c2SLisandro Dalcin /*@ 847fa2bb9feSLisandro Dalcin PetscLogEventIncludeClass - Activates event logging for a PETSc object class in every stage. 848fa2bb9feSLisandro Dalcin 849fa2bb9feSLisandro Dalcin Not Collective 850fa2bb9feSLisandro Dalcin 851fa2bb9feSLisandro Dalcin Input Parameter: 852811af0c4SBarry Smith . classid - The object class, for example `MAT_CLASSID`, `SNES_CLASSID`, etc. 853fa2bb9feSLisandro Dalcin 854fa2bb9feSLisandro Dalcin Level: developer 855fa2bb9feSLisandro Dalcin 856d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventActivateClass()`, `PetscLogEventDeactivateClass()`, `PetscLogEventActivate()`, `PetscLogEventDeactivate()` 857fa2bb9feSLisandro Dalcin @*/ 858d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventIncludeClass(PetscClassId classid) 859d71ae5a4SJacob Faibussowitsch { 860fa2bb9feSLisandro Dalcin PetscStageLog stageLog; 861fa2bb9feSLisandro Dalcin int stage; 862fa2bb9feSLisandro Dalcin 863fa2bb9feSLisandro Dalcin PetscFunctionBegin; 8649566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 86548a46eb9SPierre Jolivet for (stage = 0; stage < stageLog->numStages; stage++) PetscCall(PetscEventPerfLogActivateClass(stageLog->stageInfo[stage].eventLog, stageLog->eventLog, classid)); 8663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 867fa2bb9feSLisandro Dalcin } 868fa2bb9feSLisandro Dalcin 869fa2bb9feSLisandro Dalcin /*@ 870fa2bb9feSLisandro Dalcin PetscLogEventExcludeClass - Deactivates event logging for a PETSc object class in every stage. 871fa2bb9feSLisandro Dalcin 872fa2bb9feSLisandro Dalcin Not Collective 873fa2bb9feSLisandro Dalcin 874fa2bb9feSLisandro Dalcin Input Parameter: 875811af0c4SBarry Smith . classid - The object class, for example `MAT_CLASSID`, `SNES_CLASSID`, etc. 
876fa2bb9feSLisandro Dalcin 877fa2bb9feSLisandro Dalcin Level: developer 878fa2bb9feSLisandro Dalcin 879811af0c4SBarry Smith Note: 880811af0c4SBarry Smith If a class is excluded then events associated with that class are not logged. 881811af0c4SBarry Smith 882d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventDeactivateClass()`, `PetscLogEventActivateClass()`, `PetscLogEventDeactivate()`, `PetscLogEventActivate()` 883fa2bb9feSLisandro Dalcin @*/ 884d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventExcludeClass(PetscClassId classid) 885d71ae5a4SJacob Faibussowitsch { 886fa2bb9feSLisandro Dalcin PetscStageLog stageLog; 887fa2bb9feSLisandro Dalcin int stage; 888fa2bb9feSLisandro Dalcin 889fa2bb9feSLisandro Dalcin PetscFunctionBegin; 8909566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 89148a46eb9SPierre Jolivet for (stage = 0; stage < stageLog->numStages; stage++) PetscCall(PetscEventPerfLogDeactivateClass(stageLog->stageInfo[stage].eventLog, stageLog->eventLog, classid)); 8923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 893fa2bb9feSLisandro Dalcin } 894fa2bb9feSLisandro Dalcin 895fa2bb9feSLisandro Dalcin /*@ 8965c6c1daeSBarry Smith PetscLogEventActivate - Indicates that a particular event should be logged. 8975c6c1daeSBarry Smith 8985c6c1daeSBarry Smith Not Collective 8995c6c1daeSBarry Smith 9005c6c1daeSBarry Smith Input Parameter: 9015c6c1daeSBarry Smith . 
event - The event id 9025c6c1daeSBarry Smith 90310450e9eSJacob Faibussowitsch Example Usage: 9045c6c1daeSBarry Smith .vb 9055c6c1daeSBarry Smith PetscLogEventDeactivate(VEC_SetValues); 9065c6c1daeSBarry Smith [code where you do not want to log VecSetValues()] 9075c6c1daeSBarry Smith PetscLogEventActivate(VEC_SetValues); 9085c6c1daeSBarry Smith [code where you do want to log VecSetValues()] 9095c6c1daeSBarry Smith .ve 9105c6c1daeSBarry Smith 911d1f92df0SBarry Smith Level: advanced 912d1f92df0SBarry Smith 9135c6c1daeSBarry Smith Note: 9145c6c1daeSBarry Smith The event may be either a pre-defined PETSc event (found in include/petsclog.h) 915811af0c4SBarry Smith or an event number obtained with `PetscLogEventRegister()`. 9165c6c1daeSBarry Smith 917d1f92df0SBarry Smith .seealso: [](ch_profiling), `PlogEventDeactivate()`, `PlogEventDeactivatePush()`, `PetscLogEventDeactivatePop()` 9185c6c1daeSBarry Smith @*/ 919d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventActivate(PetscLogEvent event) 920d71ae5a4SJacob Faibussowitsch { 9215c6c1daeSBarry Smith PetscStageLog stageLog; 9225c6c1daeSBarry Smith int stage; 9235c6c1daeSBarry Smith 9245c6c1daeSBarry Smith PetscFunctionBegin; 9259566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 9269566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 9279566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogActivate(stageLog->stageInfo[stage].eventLog, event)); 9283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9295c6c1daeSBarry Smith } 9305c6c1daeSBarry Smith 9315c6c1daeSBarry Smith /*@ 9325c6c1daeSBarry Smith PetscLogEventDeactivate - Indicates that a particular event should not be logged. 9335c6c1daeSBarry Smith 9345c6c1daeSBarry Smith Not Collective 9355c6c1daeSBarry Smith 9365c6c1daeSBarry Smith Input Parameter: 9375c6c1daeSBarry Smith . 
event - The event id 9385c6c1daeSBarry Smith 93910450e9eSJacob Faibussowitsch Example Usage: 9405c6c1daeSBarry Smith .vb 9415c6c1daeSBarry Smith PetscLogEventDeactivate(VEC_SetValues); 9425c6c1daeSBarry Smith [code where you do not want to log VecSetValues()] 9435c6c1daeSBarry Smith PetscLogEventActivate(VEC_SetValues); 9445c6c1daeSBarry Smith [code where you do want to log VecSetValues()] 9455c6c1daeSBarry Smith .ve 9465c6c1daeSBarry Smith 947d1f92df0SBarry Smith Level: advanced 948d1f92df0SBarry Smith 9495c6c1daeSBarry Smith Note: 9505c6c1daeSBarry Smith The event may be either a pre-defined PETSc event (found in 951811af0c4SBarry Smith include/petsclog.h) or an event number obtained with `PetscLogEventRegister()`). 9525c6c1daeSBarry Smith 953d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventActivate()`, `PetscLogEventDeactivatePush()`, `PetscLogEventDeactivatePop()` 9545c6c1daeSBarry Smith @*/ 955d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventDeactivate(PetscLogEvent event) 956d71ae5a4SJacob Faibussowitsch { 9575c6c1daeSBarry Smith PetscStageLog stageLog; 9585c6c1daeSBarry Smith int stage; 9595c6c1daeSBarry Smith 9605c6c1daeSBarry Smith PetscFunctionBegin; 9619566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 9629566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 9639566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivate(stageLog->stageInfo[stage].eventLog, event)); 9643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9655c6c1daeSBarry Smith } 9665c6c1daeSBarry Smith 9675c6c1daeSBarry Smith /*@ 968811af0c4SBarry Smith PetscLogEventDeactivatePush - Indicates that a particular event should not be logged until `PetscLogEventDeactivatePop()` is called 969c00cb57fSBarry Smith 970c00cb57fSBarry Smith Not Collective 971c00cb57fSBarry Smith 972c00cb57fSBarry Smith Input Parameter: 973c00cb57fSBarry Smith . 
event - The event id 974c00cb57fSBarry Smith 97510450e9eSJacob Faibussowitsch Example Usage: 976c00cb57fSBarry Smith .vb 977c00cb57fSBarry Smith PetscLogEventDeactivatePush(VEC_SetValues); 978c00cb57fSBarry Smith [code where you do not want to log VecSetValues()] 979c00cb57fSBarry Smith PetscLogEventDeactivatePop(VEC_SetValues); 980c00cb57fSBarry Smith [code where you do want to log VecSetValues()] 981c00cb57fSBarry Smith .ve 982c00cb57fSBarry Smith 983d1f92df0SBarry Smith Level: advanced 984d1f92df0SBarry Smith 985c00cb57fSBarry Smith Note: 986c00cb57fSBarry Smith The event may be either a pre-defined PETSc event (found in 987811af0c4SBarry Smith include/petsclog.h) or an event number obtained with `PetscLogEventRegister()`). 988c00cb57fSBarry Smith 989d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventActivate()`, `PetscLogEventDeactivatePop()`, `PetscLogEventDeactivate()` 990c00cb57fSBarry Smith @*/ 991d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventDeactivatePush(PetscLogEvent event) 992d71ae5a4SJacob Faibussowitsch { 993c00cb57fSBarry Smith PetscStageLog stageLog; 994c00cb57fSBarry Smith int stage; 995c00cb57fSBarry Smith 996c00cb57fSBarry Smith PetscFunctionBegin; 9979566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 9989566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 9999566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivatePush(stageLog->stageInfo[stage].eventLog, event)); 10003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1001c00cb57fSBarry Smith } 1002c00cb57fSBarry Smith 1003c00cb57fSBarry Smith /*@ 1004811af0c4SBarry Smith PetscLogEventDeactivatePop - Indicates that a particular event should again be logged after the logging was turned off with `PetscLogEventDeactivatePush()` 1005c00cb57fSBarry Smith 1006c00cb57fSBarry Smith Not Collective 1007c00cb57fSBarry Smith 1008c00cb57fSBarry Smith Input Parameter: 1009c00cb57fSBarry Smith . 
event - The event id 1010c00cb57fSBarry Smith 101110450e9eSJacob Faibussowitsch Example Usage: 1012c00cb57fSBarry Smith .vb 1013c00cb57fSBarry Smith PetscLogEventDeactivatePush(VEC_SetValues); 1014c00cb57fSBarry Smith [code where you do not want to log VecSetValues()] 1015c00cb57fSBarry Smith PetscLogEventDeactivatePop(VEC_SetValues); 1016c00cb57fSBarry Smith [code where you do want to log VecSetValues()] 1017c00cb57fSBarry Smith .ve 1018c00cb57fSBarry Smith 1019d1f92df0SBarry Smith Level: advanced 1020d1f92df0SBarry Smith 1021c00cb57fSBarry Smith Note: 1022c00cb57fSBarry Smith The event may be either a pre-defined PETSc event (found in 1023811af0c4SBarry Smith include/petsclog.h) or an event number obtained with `PetscLogEventRegister()`). 1024c00cb57fSBarry Smith 1025d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventActivate()`, `PetscLogEventDeactivatePush()` 1026c00cb57fSBarry Smith @*/ 1027d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventDeactivatePop(PetscLogEvent event) 1028d71ae5a4SJacob Faibussowitsch { 1029c00cb57fSBarry Smith PetscStageLog stageLog; 1030c00cb57fSBarry Smith int stage; 1031c00cb57fSBarry Smith 1032c00cb57fSBarry Smith PetscFunctionBegin; 10339566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 10349566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 10359566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivatePop(stageLog->stageInfo[stage].eventLog, event)); 10363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1037c00cb57fSBarry Smith } 1038c00cb57fSBarry Smith 1039c00cb57fSBarry Smith /*@ 1040811af0c4SBarry Smith PetscLogEventSetActiveAll - Turns on logging of all events 10415c6c1daeSBarry Smith 10425c6c1daeSBarry Smith Not Collective 10435c6c1daeSBarry Smith 10445c6c1daeSBarry Smith Input Parameters: 10455c6c1daeSBarry Smith + event - The event id 10465c6c1daeSBarry Smith - isActive - The activity flag determining whether the event is 
logged 10475c6c1daeSBarry Smith 10485c6c1daeSBarry Smith Level: advanced 10495c6c1daeSBarry Smith 1050d1f92df0SBarry Smith .seealso: [](ch_profiling), `PlogEventActivate()`, `PlogEventDeactivate()` 10515c6c1daeSBarry Smith @*/ 1052d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventSetActiveAll(PetscLogEvent event, PetscBool isActive) 1053d71ae5a4SJacob Faibussowitsch { 10545c6c1daeSBarry Smith PetscStageLog stageLog; 10555c6c1daeSBarry Smith int stage; 10565c6c1daeSBarry Smith 10575c6c1daeSBarry Smith PetscFunctionBegin; 10589566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 10595c6c1daeSBarry Smith for (stage = 0; stage < stageLog->numStages; stage++) { 10605c6c1daeSBarry Smith if (isActive) { 10619566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogActivate(stageLog->stageInfo[stage].eventLog, event)); 10625c6c1daeSBarry Smith } else { 10639566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivate(stageLog->stageInfo[stage].eventLog, event)); 10645c6c1daeSBarry Smith } 10655c6c1daeSBarry Smith } 10663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10675c6c1daeSBarry Smith } 10685c6c1daeSBarry Smith 10695c6c1daeSBarry Smith /*@ 1070811af0c4SBarry Smith PetscLogEventActivateClass - Activates event logging for a PETSc object class for the current stage 10715c6c1daeSBarry Smith 10725c6c1daeSBarry Smith Not Collective 10735c6c1daeSBarry Smith 10745c6c1daeSBarry Smith Input Parameter: 1075811af0c4SBarry Smith . classid - The event class, for example `MAT_CLASSID`, `SNES_CLASSID`, etc. 
10765c6c1daeSBarry Smith 10775c6c1daeSBarry Smith Level: developer 10785c6c1daeSBarry Smith 1079d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventIncludeClass()`, `PetscLogEventExcludeClass()`, `PetscLogEventDeactivateClass()`, `PetscLogEventActivate()`, `PetscLogEventDeactivate()` 10805c6c1daeSBarry Smith @*/ 1081d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventActivateClass(PetscClassId classid) 1082d71ae5a4SJacob Faibussowitsch { 10835c6c1daeSBarry Smith PetscStageLog stageLog; 10845c6c1daeSBarry Smith int stage; 10855c6c1daeSBarry Smith 10865c6c1daeSBarry Smith PetscFunctionBegin; 10879566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 10889566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 10899566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogActivateClass(stageLog->stageInfo[stage].eventLog, stageLog->eventLog, classid)); 10903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10915c6c1daeSBarry Smith } 10925c6c1daeSBarry Smith 10935c6c1daeSBarry Smith /*@ 1094811af0c4SBarry Smith PetscLogEventDeactivateClass - Deactivates event logging for a PETSc object class for the current stage 10955c6c1daeSBarry Smith 10965c6c1daeSBarry Smith Not Collective 10975c6c1daeSBarry Smith 10985c6c1daeSBarry Smith Input Parameter: 1099811af0c4SBarry Smith . classid - The event class, for example `MAT_CLASSID`, `SNES_CLASSID`, etc. 
11005c6c1daeSBarry Smith 11015c6c1daeSBarry Smith Level: developer 11025c6c1daeSBarry Smith 1103d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventIncludeClass()`, `PetscLogEventExcludeClass()`, `PetscLogEventActivateClass()`, `PetscLogEventActivate()`, `PetscLogEventDeactivate()` 11045c6c1daeSBarry Smith @*/ 1105d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventDeactivateClass(PetscClassId classid) 1106d71ae5a4SJacob Faibussowitsch { 11075c6c1daeSBarry Smith PetscStageLog stageLog; 11085c6c1daeSBarry Smith int stage; 11095c6c1daeSBarry Smith 11105c6c1daeSBarry Smith PetscFunctionBegin; 11119566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 11129566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 11139566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivateClass(stageLog->stageInfo[stage].eventLog, stageLog->eventLog, classid)); 11143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11155c6c1daeSBarry Smith } 11165c6c1daeSBarry Smith 11175c6c1daeSBarry Smith /*MC 111862872c28SLisandro Dalcin PetscLogEventSync - Synchronizes the beginning of a user event. 
111962872c28SLisandro Dalcin 112062872c28SLisandro Dalcin Synopsis: 112162872c28SLisandro Dalcin #include <petsclog.h> 112262872c28SLisandro Dalcin PetscErrorCode PetscLogEventSync(int e, MPI_Comm comm) 112362872c28SLisandro Dalcin 112462872c28SLisandro Dalcin Collective 112562872c28SLisandro Dalcin 112662872c28SLisandro Dalcin Input Parameters: 112762872c28SLisandro Dalcin + e - integer associated with the event obtained from PetscLogEventRegister() 112862872c28SLisandro Dalcin - comm - an MPI communicator 112962872c28SLisandro Dalcin 113010450e9eSJacob Faibussowitsch Example Usage: 113162872c28SLisandro Dalcin .vb 113262872c28SLisandro Dalcin PetscLogEvent USER_EVENT; 113310450e9eSJacob Faibussowitsch 113462872c28SLisandro Dalcin PetscLogEventRegister("User event", 0, &USER_EVENT); 113562872c28SLisandro Dalcin PetscLogEventSync(USER_EVENT, PETSC_COMM_WORLD); 113662872c28SLisandro Dalcin PetscLogEventBegin(USER_EVENT, 0, 0, 0, 0); 113762872c28SLisandro Dalcin [code segment to monitor] 113862872c28SLisandro Dalcin PetscLogEventEnd(USER_EVENT, 0, 0, 0 , 0); 113962872c28SLisandro Dalcin .ve 114062872c28SLisandro Dalcin 1141d1f92df0SBarry Smith Level: developer 1142d1f92df0SBarry Smith 1143811af0c4SBarry Smith Note: 114410450e9eSJacob Faibussowitsch This routine should be called only if there is not a `PetscObject` available to pass to 114510450e9eSJacob Faibussowitsch `PetscLogEventBegin()`. 114662872c28SLisandro Dalcin 1147d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()` 114862872c28SLisandro Dalcin M*/ 114962872c28SLisandro Dalcin 115062872c28SLisandro Dalcin /*MC 11515c6c1daeSBarry Smith PetscLogEventBegin - Logs the beginning of a user event. 
11525c6c1daeSBarry Smith 11535c6c1daeSBarry Smith Synopsis: 1154aaa7dc30SBarry Smith #include <petsclog.h> 1155f2ba6396SBarry Smith PetscErrorCode PetscLogEventBegin(int e, PetscObject o1, PetscObject o2, PetscObject o3, PetscObject o4) 11565c6c1daeSBarry Smith 11575c6c1daeSBarry Smith Not Collective 11585c6c1daeSBarry Smith 11595c6c1daeSBarry Smith Input Parameters: 11605c6c1daeSBarry Smith + e - integer associated with the event obtained from PetscLogEventRegister() 11615c6c1daeSBarry Smith - o1,o2,o3,o4 - objects associated with the event, or 0 11625c6c1daeSBarry Smith 11635c6c1daeSBarry Smith Fortran Synopsis: 11645c6c1daeSBarry Smith void PetscLogEventBegin(int e, PetscErrorCode ierr) 11655c6c1daeSBarry Smith 116610450e9eSJacob Faibussowitsch Example Usage: 11675c6c1daeSBarry Smith .vb 11685c6c1daeSBarry Smith PetscLogEvent USER_EVENT; 116910450e9eSJacob Faibussowitsch 11705c6c1daeSBarry Smith PetscLogDouble user_event_flops; 11715c6c1daeSBarry Smith PetscLogEventRegister("User event",0, &USER_EVENT); 11725c6c1daeSBarry Smith PetscLogEventBegin(USER_EVENT, 0, 0, 0, 0); 11735c6c1daeSBarry Smith [code segment to monitor] 11745c6c1daeSBarry Smith PetscLogFlops(user_event_flops); 11755c6c1daeSBarry Smith PetscLogEventEnd(USER_EVENT, 0, 0, 0, 0); 11765c6c1daeSBarry Smith .ve 11775c6c1daeSBarry Smith 1178d1f92df0SBarry Smith Level: intermediate 1179d1f92df0SBarry Smith 1180811af0c4SBarry Smith Developer Note: 118110450e9eSJacob Faibussowitsch `PetscLogEventBegin()` and `PetscLogEventEnd()` return error codes instead of explicitly 118210450e9eSJacob Faibussowitsch handling the errors that occur in the macro directly because other packages that use these 118310450e9eSJacob Faibussowitsch macros have used them in their own functions or methods that do not return error codes and it 118410450e9eSJacob Faibussowitsch would be disruptive to change the current behavior.
1185d0609cedSBarry Smith 1186d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventRegister()`, `PetscLogEventEnd()`, `PetscLogFlops()` 11875c6c1daeSBarry Smith M*/ 11885c6c1daeSBarry Smith 11895c6c1daeSBarry Smith /*MC 11905c6c1daeSBarry Smith PetscLogEventEnd - Log the end of a user event. 11915c6c1daeSBarry Smith 11925c6c1daeSBarry Smith Synopsis: 1193aaa7dc30SBarry Smith #include <petsclog.h> 1194f2ba6396SBarry Smith PetscErrorCode PetscLogEventEnd(int e, PetscObject o1, PetscObject o2, PetscObject o3, PetscObject o4) 11955c6c1daeSBarry Smith 11965c6c1daeSBarry Smith Not Collective 11975c6c1daeSBarry Smith 11985c6c1daeSBarry Smith Input Parameters: 11995c6c1daeSBarry Smith + e - integer associated with the event obtained with PetscLogEventRegister() 12005c6c1daeSBarry Smith - o1,o2,o3,o4 - objects associated with the event, or 0 12015c6c1daeSBarry Smith 12025c6c1daeSBarry Smith Fortran Synopsis: 12035c6c1daeSBarry Smith void PetscLogEventEnd(int e, PetscErrorCode ierr) 12045c6c1daeSBarry Smith 120510450e9eSJacob Faibussowitsch Example Usage: 12065c6c1daeSBarry Smith .vb 12075c6c1daeSBarry Smith PetscLogEvent USER_EVENT; 120810450e9eSJacob Faibussowitsch 12095c6c1daeSBarry Smith PetscLogDouble user_event_flops; 121010450e9eSJacob Faibussowitsch PetscLogEventRegister("User event", 0, &USER_EVENT); 12115c6c1daeSBarry Smith PetscLogEventBegin(USER_EVENT, 0, 0, 0, 0); 12125c6c1daeSBarry Smith [code segment to monitor] 12135c6c1daeSBarry Smith PetscLogFlops(user_event_flops); 12145c6c1daeSBarry Smith PetscLogEventEnd(USER_EVENT, 0, 0, 0, 0); 12155c6c1daeSBarry Smith .ve 12165c6c1daeSBarry Smith 12175c6c1daeSBarry Smith Level: intermediate 12185c6c1daeSBarry Smith 1219d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogFlops()` 12205c6c1daeSBarry Smith M*/ 12215c6c1daeSBarry Smith 12225c6c1daeSBarry Smith /*@C 12235c6c1daeSBarry Smith PetscLogEventGetId - Returns the event id when given the event name. 
12245c6c1daeSBarry Smith 12255c6c1daeSBarry Smith Not Collective 12265c6c1daeSBarry Smith 12275c6c1daeSBarry Smith Input Parameter: 12285c6c1daeSBarry Smith . name - The event name 12295c6c1daeSBarry Smith 12305c6c1daeSBarry Smith Output Parameter: 1231c5deb1d5SJed Brown . event - The event, or -1 if no event with that name exists 12325c6c1daeSBarry Smith 12335c6c1daeSBarry Smith Level: intermediate 12345c6c1daeSBarry Smith 1235d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscLogStageGetId()` 12365c6c1daeSBarry Smith @*/ 1237d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventGetId(const char name[], PetscLogEvent *event) 1238d71ae5a4SJacob Faibussowitsch { 12395c6c1daeSBarry Smith PetscStageLog stageLog; 12405c6c1daeSBarry Smith 12415c6c1daeSBarry Smith PetscFunctionBegin; 12429566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 12439566063dSJacob Faibussowitsch PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, name, event)); 12443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12455c6c1daeSBarry Smith } 12465c6c1daeSBarry Smith 1247d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogPushCurrentEvent_Internal(PetscLogEvent event) 1248d71ae5a4SJacob Faibussowitsch { 12497a101e5eSJacob Faibussowitsch PetscFunctionBegin; 1250c708d6e3SStefano Zampini if (!PetscDefined(HAVE_THREADSAFETY)) PetscCall(PetscIntStackPush(current_log_event_stack, event)); 12513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12527a101e5eSJacob Faibussowitsch } 12537a101e5eSJacob Faibussowitsch 1254d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogPopCurrentEvent_Internal(void) 1255d71ae5a4SJacob Faibussowitsch { 12567a101e5eSJacob Faibussowitsch PetscFunctionBegin; 1257c708d6e3SStefano Zampini if (!PetscDefined(HAVE_THREADSAFETY)) PetscCall(PetscIntStackPop(current_log_event_stack, NULL)); 12583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 
12597a101e5eSJacob Faibussowitsch } 12607a101e5eSJacob Faibussowitsch 1261d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogGetCurrentEvent_Internal(PetscLogEvent *event) 1262d71ae5a4SJacob Faibussowitsch { 12637a101e5eSJacob Faibussowitsch PetscBool empty; 12647a101e5eSJacob Faibussowitsch 12657a101e5eSJacob Faibussowitsch PetscFunctionBegin; 12664f572ea9SToby Isaac PetscAssertPointer(event, 1); 12677a101e5eSJacob Faibussowitsch *event = PETSC_DECIDE; 12687a101e5eSJacob Faibussowitsch PetscCall(PetscIntStackEmpty(current_log_event_stack, &empty)); 12697a101e5eSJacob Faibussowitsch if (!empty) PetscCall(PetscIntStackTop(current_log_event_stack, event)); 12703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12717a101e5eSJacob Faibussowitsch } 12727a101e5eSJacob Faibussowitsch 1273d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventPause_Internal(PetscLogEvent event) 1274d71ae5a4SJacob Faibussowitsch { 12757a101e5eSJacob Faibussowitsch PetscFunctionBegin; 12767a101e5eSJacob Faibussowitsch if (event != PETSC_DECIDE) PetscCall(PetscLogEventEnd(event, NULL, NULL, NULL, NULL)); 12773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12787a101e5eSJacob Faibussowitsch } 12797a101e5eSJacob Faibussowitsch 1280d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogEventResume_Internal(PetscLogEvent event) 1281d71ae5a4SJacob Faibussowitsch { 12827a101e5eSJacob Faibussowitsch PetscStageLog stageLog; 12837a101e5eSJacob Faibussowitsch PetscEventPerfLog eventLog; 12847a101e5eSJacob Faibussowitsch int stage; 12857a101e5eSJacob Faibussowitsch 12867a101e5eSJacob Faibussowitsch PetscFunctionBegin; 12873ba16761SJacob Faibussowitsch if (event == PETSC_DECIDE) PetscFunctionReturn(PETSC_SUCCESS); 12887a101e5eSJacob Faibussowitsch PetscCall(PetscLogEventBegin(event, NULL, NULL, NULL, NULL)); 12897a101e5eSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 12907a101e5eSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 
12917a101e5eSJacob Faibussowitsch PetscCall(PetscStageLogGetEventPerfLog(stageLog, stage, &eventLog)); 12927a101e5eSJacob Faibussowitsch eventLog->eventInfo[event].count--; 12933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12947a101e5eSJacob Faibussowitsch } 12957a101e5eSJacob Faibussowitsch 1296*1c1ad86eSToby Isaac /*------------------------------------------------ Class Functions --------------------------------------------------*/ 1297*1c1ad86eSToby Isaac 1298*1c1ad86eSToby Isaac /*MC 1299*1c1ad86eSToby Isaac PetscLogObjectCreate - Log the creation of a `PetscObject` 1300*1c1ad86eSToby Isaac 1301*1c1ad86eSToby Isaac Synopsis: 1302*1c1ad86eSToby Isaac #include <petsclog.h> 1303*1c1ad86eSToby Isaac PetscErrorCode PetscLogObjectCreate(PetscObject h) 1304*1c1ad86eSToby Isaac 1305*1c1ad86eSToby Isaac Not Collective 1306*1c1ad86eSToby Isaac 1307*1c1ad86eSToby Isaac Input Parameters: 1308*1c1ad86eSToby Isaac . h - A `PetscObject` 1309*1c1ad86eSToby Isaac 1310*1c1ad86eSToby Isaac Level: developer 1311*1c1ad86eSToby Isaac 1312*1c1ad86eSToby Isaac Developer Note: 1313*1c1ad86eSToby Isaac Called internally by PETSc when creating objects: users do not need to call this directly. 1314*1c1ad86eSToby Isaac 1315*1c1ad86eSToby Isaac .seealso: [](ch_profiling), `PetscLogObjectDestroy()` 1316*1c1ad86eSToby Isaac M*/ 1317*1c1ad86eSToby Isaac 1318*1c1ad86eSToby Isaac /*MC 1319*1c1ad86eSToby Isaac PetscLogObjectDestroy - Logs the destruction of a `PetscObject` 1320*1c1ad86eSToby Isaac 1321*1c1ad86eSToby Isaac Synopsis: 1322*1c1ad86eSToby Isaac #include <petsclog.h> 1323*1c1ad86eSToby Isaac PetscErrorCode PetscLogObjectDestroy(PetscObject h) 1324*1c1ad86eSToby Isaac 1325*1c1ad86eSToby Isaac Not Collective 1326*1c1ad86eSToby Isaac 1327*1c1ad86eSToby Isaac Input Parameters: 1328*1c1ad86eSToby Isaac . 
h - A `PetscObject` 1329*1c1ad86eSToby Isaac 1330*1c1ad86eSToby Isaac Level: developer 1331*1c1ad86eSToby Isaac 1332*1c1ad86eSToby Isaac Developer Note: 1333*1c1ad86eSToby Isaac Called internally by PETSc when destroying objects: users do not need to call this directly. 1334*1c1ad86eSToby Isaac 1335*1c1ad86eSToby Isaac .seealso: [](ch_profiling), `PetscLogObjectCreate()` 1336*1c1ad86eSToby Isaac M*/ 1337*1c1ad86eSToby Isaac 13385c6c1daeSBarry Smith /*------------------------------------------------ Output Functions -------------------------------------------------*/ 13395c6c1daeSBarry Smith /*@C 13405c6c1daeSBarry Smith PetscLogDump - Dumps logs of objects to a file. This file is intended to 13415c6c1daeSBarry Smith be read by bin/petscview. This program no longer exists. 13425c6c1daeSBarry Smith 1343811af0c4SBarry Smith Collective on `PETSC_COMM_WORLD` 13445c6c1daeSBarry Smith 13455c6c1daeSBarry Smith Input Parameter: 1346aec76313SJacob Faibussowitsch . sname - an optional file name 13475c6c1daeSBarry Smith 134810450e9eSJacob Faibussowitsch Example Usage: 13495c6c1daeSBarry Smith .vb 13505c6c1daeSBarry Smith PetscInitialize(...); 1351bb1d7374SBarry Smith PetscLogDefaultBegin(); or PetscLogAllBegin(); 13525c6c1daeSBarry Smith ... code ... 13535c6c1daeSBarry Smith PetscLogDump(filename); 13545c6c1daeSBarry Smith PetscFinalize(); 13555c6c1daeSBarry Smith .ve 13565c6c1daeSBarry Smith 1357d1f92df0SBarry Smith Level: advanced 1358d1f92df0SBarry Smith 1359811af0c4SBarry Smith Note: 136037fdd005SBarry Smith The default file name is Log.<rank> where <rank> is the MPI process rank. If no name is specified, 13615c6c1daeSBarry Smith this file will be used. 
13625c6c1daeSBarry Smith 1363d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDefaultBegin()`, `PetscLogAllBegin()`, `PetscLogView()` 13645c6c1daeSBarry Smith @*/ 1365d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogDump(const char sname[]) 1366d71ae5a4SJacob Faibussowitsch { 13675c6c1daeSBarry Smith PetscStageLog stageLog; 13685c6c1daeSBarry Smith PetscEventPerfInfo *eventInfo; 13695c6c1daeSBarry Smith FILE *fd; 13705c6c1daeSBarry Smith char file[PETSC_MAX_PATH_LEN], fname[PETSC_MAX_PATH_LEN]; 13715c6c1daeSBarry Smith PetscLogDouble flops, _TotalTime; 13725c6c1daeSBarry Smith PetscMPIInt rank; 13735c6c1daeSBarry Smith int action, object, curStage; 13745c6c1daeSBarry Smith PetscLogEvent event; 13755c6c1daeSBarry Smith 13765c6c1daeSBarry Smith PetscFunctionBegin; 13775c6c1daeSBarry Smith /* Calculate the total elapsed time */ 13783ba16761SJacob Faibussowitsch PetscCall(PetscTime(&_TotalTime)); 13795c6c1daeSBarry Smith _TotalTime -= petsc_BaseTime; 13805c6c1daeSBarry Smith /* Open log file */ 13819566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD, &rank)); 1382a364092eSJacob Faibussowitsch PetscCall(PetscSNPrintf(file, PETSC_STATIC_ARRAY_LENGTH(file), "%s.%d", sname && sname[0] ? 
sname : "Log", rank)); 13839566063dSJacob Faibussowitsch PetscCall(PetscFixFilename(file, fname)); 13849566063dSJacob Faibussowitsch PetscCall(PetscFOpen(PETSC_COMM_WORLD, fname, "w", &fd)); 138508401ef6SPierre Jolivet PetscCheck(!(rank == 0) || !(!fd), PETSC_COMM_SELF, PETSC_ERR_FILE_OPEN, "Cannot open file: %s", fname); 13865c6c1daeSBarry Smith /* Output totals */ 13879566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Total Flop %14e %16.8e\n", petsc_TotalFlops, _TotalTime)); 13889566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Clock Resolution %g\n", 0.0)); 13895c6c1daeSBarry Smith /* Output actions */ 13905c6c1daeSBarry Smith if (petsc_logActions) { 13919566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Actions accomplished %d\n", petsc_numActions)); 13925c6c1daeSBarry Smith for (action = 0; action < petsc_numActions; action++) { 13939371c9d4SSatish Balay PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "%g %d %d %d %d %d %d %g %g %g\n", petsc_actions[action].time, petsc_actions[action].action, (int)petsc_actions[action].event, (int)petsc_actions[action].classid, petsc_actions[action].id1, 1394d0609cedSBarry Smith petsc_actions[action].id2, petsc_actions[action].id3, petsc_actions[action].flops, petsc_actions[action].mem, petsc_actions[action].maxmem)); 13955c6c1daeSBarry Smith } 13965c6c1daeSBarry Smith } 13975c6c1daeSBarry Smith /* Output objects */ 13985c6c1daeSBarry Smith if (petsc_logObjects) { 13999566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Objects created %d destroyed %d\n", petsc_numObjects, petsc_numObjectsDestroyed)); 14005c6c1daeSBarry Smith for (object = 0; object < petsc_numObjects; object++) { 14019566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Parent ID: %d Memory: %d\n", petsc_objects[object].parent, (int)petsc_objects[object].mem)); 14025c6c1daeSBarry Smith if (!petsc_objects[object].name[0]) { 14039566063dSJacob 
Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "No Name\n")); 14045c6c1daeSBarry Smith } else { 14059566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Name: %s\n", petsc_objects[object].name)); 14065c6c1daeSBarry Smith } 14075c6c1daeSBarry Smith if (petsc_objects[object].info[0] != 0) { 14089566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "No Info\n")); 14095c6c1daeSBarry Smith } else { 14109566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Info: %s\n", petsc_objects[object].info)); 14115c6c1daeSBarry Smith } 14125c6c1daeSBarry Smith } 14135c6c1daeSBarry Smith } 14145c6c1daeSBarry Smith /* Output events */ 14159566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Event log:\n")); 14169566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 14179566063dSJacob Faibussowitsch PetscCall(PetscIntStackTop(stageLog->stack, &curStage)); 14185c6c1daeSBarry Smith eventInfo = stageLog->stageInfo[curStage].eventLog->eventInfo; 14195c6c1daeSBarry Smith for (event = 0; event < stageLog->stageInfo[curStage].eventLog->numEvents; event++) { 1420a297a907SKarl Rupp if (eventInfo[event].time != 0.0) flops = eventInfo[event].flops / eventInfo[event].time; 1421a297a907SKarl Rupp else flops = 0.0; 1422d0609cedSBarry Smith PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "%d %16d %16g %16g %16g\n", event, eventInfo[event].count, eventInfo[event].flops, eventInfo[event].time, flops)); 14235c6c1daeSBarry Smith } 14249566063dSJacob Faibussowitsch PetscCall(PetscFClose(PETSC_COMM_WORLD, fd)); 14253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14265c6c1daeSBarry Smith } 14275c6c1daeSBarry Smith 1428f14045dbSBarry Smith /* 1429f14045dbSBarry Smith PetscLogView_Detailed - Each process prints the times for its own events 1430f14045dbSBarry Smith 1431f14045dbSBarry Smith */ 143210450e9eSJacob Faibussowitsch static PetscErrorCode 
PetscLogView_Detailed(PetscViewer viewer) 1433d71ae5a4SJacob Faibussowitsch { 14342dff6485SMatthew G. Knepley PetscStageLog stageLog; 1435217044c2SLisandro Dalcin PetscEventPerfInfo *eventInfo = NULL, *stageInfo = NULL; 1436217044c2SLisandro Dalcin PetscLogDouble locTotalTime, numRed, maxMem; 14372dff6485SMatthew G. Knepley int numStages, numEvents, stage, event; 1438217044c2SLisandro Dalcin MPI_Comm comm = PetscObjectComm((PetscObject)viewer); 14392dff6485SMatthew G. Knepley PetscMPIInt rank, size; 1440f14045dbSBarry Smith 1441f14045dbSBarry Smith PetscFunctionBegin; 14429566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 14439566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &rank)); 14442dff6485SMatthew G. Knepley /* Must preserve reduction count before we go on */ 14452dff6485SMatthew G. Knepley numRed = petsc_allreduce_ct + petsc_gather_ct + petsc_scatter_ct; 14462d1ec343SBarry Smith /* Get the total elapsed time */ 14473ba16761SJacob Faibussowitsch PetscCall(PetscTime(&locTotalTime)); 14489371c9d4SSatish Balay locTotalTime -= petsc_BaseTime; 14499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "size = %d\n", size)); 14509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "LocalTimes = {}\n")); 14519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "LocalMessages = {}\n")); 14529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "LocalMessageLens = {}\n")); 14539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "LocalReductions = {}\n")); 14549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "LocalFlop = {}\n")); 14559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "LocalObjects = {}\n")); 14569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "LocalMemory = {}\n")); 14579566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 14589566063dSJacob 
Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->numStages, &numStages, 1, MPI_INT, MPI_MAX, comm)); 14599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "Stages = {}\n")); 14602d1ec343SBarry Smith for (stage = 0; stage < numStages; stage++) { 14619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "Stages[\"%s\"] = {}\n", stageLog->stageInfo[stage].name)); 14629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "Stages[\"%s\"][\"summary\"] = {}\n", stageLog->stageInfo[stage].name)); 14639566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->stageInfo[stage].eventLog->numEvents, &numEvents, 1, MPI_INT, MPI_MAX, comm)); 146448a46eb9SPierre Jolivet for (event = 0; event < numEvents; event++) PetscCall(PetscViewerASCIIPrintf(viewer, "Stages[\"%s\"][\"%s\"] = {}\n", stageLog->stageInfo[stage].name, stageLog->eventLog->eventInfo[event].name)); 14652d1ec343SBarry Smith } 14669566063dSJacob Faibussowitsch PetscCall(PetscMallocGetMaximumUsage(&maxMem)); 14679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPushSynchronized(viewer)); 14689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "LocalTimes[%d] = %g\n", rank, locTotalTime)); 14699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "LocalMessages[%d] = %g\n", rank, (petsc_irecv_ct + petsc_isend_ct + petsc_recv_ct + petsc_send_ct))); 14709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "LocalMessageLens[%d] = %g\n", rank, (petsc_irecv_len + petsc_isend_len + petsc_recv_len + petsc_send_len))); 14719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "LocalReductions[%d] = %g\n", rank, numRed)); 14729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "LocalFlop[%d] = %g\n", rank, petsc_TotalFlops)); 14739566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "LocalObjects[%d] = %d\n", rank, petsc_numObjects)); 14749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "LocalMemory[%d] = %g\n", rank, maxMem)); 14759566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 14762d1ec343SBarry Smith for (stage = 0; stage < numStages; stage++) { 1477217044c2SLisandro Dalcin stageInfo = &stageLog->stageInfo[stage].perfInfo; 14789371c9d4SSatish Balay PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "Stages[\"%s\"][\"summary\"][%d] = {\"time\" : %g, \"numMessages\" : %g, \"messageLength\" : %g, \"numReductions\" : %g, \"flop\" : %g}\n", stageLog->stageInfo[stage].name, rank, stageInfo->time, 14799371c9d4SSatish Balay stageInfo->numMessages, stageInfo->messageLength, stageInfo->numReductions, stageInfo->flops)); 14809566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->stageInfo[stage].eventLog->numEvents, &numEvents, 1, MPI_INT, MPI_MAX, comm)); 14812d1ec343SBarry Smith for (event = 0; event < numEvents; event++) { 1482217044c2SLisandro Dalcin eventInfo = &stageLog->stageInfo[stage].eventLog->eventInfo[event]; 1483d0609cedSBarry Smith PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "Stages[\"%s\"][\"%s\"][%d] = {\"count\" : %d, \"time\" : %g, \"syncTime\" : %g, \"numMessages\" : %g, \"messageLength\" : %g, \"numReductions\" : %g, \"flop\" : %g", 14849371c9d4SSatish Balay stageLog->stageInfo[stage].name, stageLog->eventLog->eventInfo[event].name, rank, eventInfo->count, eventInfo->time, eventInfo->syncTime, eventInfo->numMessages, eventInfo->messageLength, eventInfo->numReductions, 14859371c9d4SSatish Balay eventInfo->flops)); 1486891e75beSMatthew G. Knepley if (eventInfo->dof[0] >= 0.) { 1487891e75beSMatthew G. Knepley PetscInt d, e; 14885d68e14cSMatthew G. Knepley 14899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ", \"dof\" : [")); 1490891e75beSMatthew G. 
Knepley for (d = 0; d < 8; ++d) { 14919566063dSJacob Faibussowitsch if (d > 0) PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ", ")); 14929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "%g", eventInfo->dof[d])); 1493891e75beSMatthew G. Knepley } 14949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "]")); 14959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ", \"error\" : [")); 14965d68e14cSMatthew G. Knepley for (e = 0; e < 8; ++e) { 14979566063dSJacob Faibussowitsch if (e > 0) PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ", ")); 14989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "%g", eventInfo->errors[e])); 14995d68e14cSMatthew G. Knepley } 15009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "]")); 15015d68e14cSMatthew G. Knepley } 15029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "}\n")); 15032d1ec343SBarry Smith } 15042d1ec343SBarry Smith } 15059566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 15069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPopSynchronized(viewer)); 15073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1508f14045dbSBarry Smith } 1509f14045dbSBarry Smith 151038144912Sdeepblu2718 /* 151138144912Sdeepblu2718 PetscLogView_CSV - Each process prints the times for its own events in Comma-Separated Value Format 151238144912Sdeepblu2718 */ 151310450e9eSJacob Faibussowitsch static PetscErrorCode PetscLogView_CSV(PetscViewer viewer) 1514d71ae5a4SJacob Faibussowitsch { 151538144912Sdeepblu2718 PetscStageLog stageLog; 1516669c5be0SSatish Balay PetscEventPerfInfo *eventInfo = NULL; 151738144912Sdeepblu2718 PetscLogDouble locTotalTime, maxMem; 151838144912Sdeepblu2718 int numStages, numEvents, stage, event; 151938144912Sdeepblu2718 MPI_Comm comm = PetscObjectComm((PetscObject)viewer); 
152038144912Sdeepblu2718 PetscMPIInt rank, size; 152138144912Sdeepblu2718 152238144912Sdeepblu2718 PetscFunctionBegin; 15239566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 15249566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &rank)); 152538144912Sdeepblu2718 /* Must preserve reduction count before we go on */ 152638144912Sdeepblu2718 /* Get the total elapsed time */ 15273ba16761SJacob Faibussowitsch PetscCall(PetscTime(&locTotalTime)); 15289371c9d4SSatish Balay locTotalTime -= petsc_BaseTime; 15299566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 15309566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->numStages, &numStages, 1, MPI_INT, MPI_MAX, comm)); 15319566063dSJacob Faibussowitsch PetscCall(PetscMallocGetMaximumUsage(&maxMem)); 15329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPushSynchronized(viewer)); 1533d0609cedSBarry Smith PetscCall(PetscViewerASCIIPrintf(viewer, "Stage Name,Event Name,Rank,Count,Time,Num Messages,Message Length,Num Reductions,FLOP,dof0,dof1,dof2,dof3,dof4,dof5,dof6,dof7,e0,e1,e2,e3,e4,e5,e6,e7,%d\n", size)); 15349566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 153538144912Sdeepblu2718 for (stage = 0; stage < numStages; stage++) { 15369e29573dSMatthew G. Knepley PetscEventPerfInfo *stageInfo = &stageLog->stageInfo[stage].perfInfo; 15379e29573dSMatthew G. 
Knepley 15389371c9d4SSatish Balay PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "%s,summary,%d,1,%g,%g,%g,%g,%g\n", stageLog->stageInfo[stage].name, rank, stageInfo->time, stageInfo->numMessages, stageInfo->messageLength, stageInfo->numReductions, stageInfo->flops)); 15399566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->stageInfo[stage].eventLog->numEvents, &numEvents, 1, MPI_INT, MPI_MAX, comm)); 154038144912Sdeepblu2718 for (event = 0; event < numEvents; event++) { 154138144912Sdeepblu2718 eventInfo = &stageLog->stageInfo[stage].eventLog->eventInfo[event]; 15429371c9d4SSatish Balay PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "%s,%s,%d,%d,%g,%g,%g,%g,%g", stageLog->stageInfo[stage].name, stageLog->eventLog->eventInfo[event].name, rank, eventInfo->count, eventInfo->time, eventInfo->numMessages, eventInfo->messageLength, 15439371c9d4SSatish Balay eventInfo->numReductions, eventInfo->flops)); 154438144912Sdeepblu2718 if (eventInfo->dof[0] >= 0.) { 154538144912Sdeepblu2718 PetscInt d, e; 154638144912Sdeepblu2718 154748a46eb9SPierre Jolivet for (d = 0; d < 8; ++d) PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ",%g", eventInfo->dof[d])); 154848a46eb9SPierre Jolivet for (e = 0; e < 8; ++e) PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ",%g", eventInfo->errors[e])); 154938144912Sdeepblu2718 } 15509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "\n")); 155138144912Sdeepblu2718 } 155238144912Sdeepblu2718 } 15539566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 15549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPopSynchronized(viewer)); 15553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 155638144912Sdeepblu2718 } 155738144912Sdeepblu2718 1558d71ae5a4SJacob Faibussowitsch static PetscErrorCode PetscLogViewWarnSync(MPI_Comm comm, FILE *fd) 1559d71ae5a4SJacob Faibussowitsch { 1560217044c2SLisandro Dalcin PetscFunctionBegin; 15613ba16761SJacob 
Faibussowitsch if (!PetscLogSyncOn) PetscFunctionReturn(PETSC_SUCCESS); 15629566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n\n")); 15639566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n")); 15649566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 15659566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # WARNING!!! #\n")); 15669566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 15679566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # This program was run with logging synchronization. #\n")); 15689566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # This option provides more meaningful imbalance #\n")); 15699566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # figures at the expense of slowing things down and #\n")); 15709566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # providing a distorted view of the overall runtime. 
#\n")); 15719566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 15729566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n\n\n")); 15733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1574217044c2SLisandro Dalcin } 1575217044c2SLisandro Dalcin 1576d71ae5a4SJacob Faibussowitsch static PetscErrorCode PetscLogViewWarnDebugging(MPI_Comm comm, FILE *fd) 1577d71ae5a4SJacob Faibussowitsch { 1578f4091ad2SBarry Smith PetscFunctionBegin; 157976bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 15809566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n\n")); 15819566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n")); 15829566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 15839566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # WARNING!!! #\n")); 15849566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 15859566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # This code was compiled with a debugging option. #\n")); 15869566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # To get timing results run ./configure #\n")); 15879566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # using --with-debugging=no, the performance will #\n")); 15889566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # be generally two or three times faster. 
#\n")); 15899566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 15909566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n\n\n")); 159176bd3646SJed Brown } 15923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1593f4091ad2SBarry Smith } 1594f4091ad2SBarry Smith 1595d71ae5a4SJacob Faibussowitsch static PetscErrorCode PetscLogViewWarnNoGpuAwareMpi(MPI_Comm comm, FILE *fd) 1596d71ae5a4SJacob Faibussowitsch { 1597009ab46cSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 1598009ab46cSJunchao Zhang PetscMPIInt size; 15998fe3844cSJunchao Zhang PetscBool deviceInitialized = PETSC_FALSE; 1600c2a741eeSJunchao Zhang 1601c2a741eeSJunchao Zhang PetscFunctionBegin; 16029566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 16038fe3844cSJunchao Zhang for (int i = PETSC_DEVICE_HOST + 1; i < PETSC_DEVICE_MAX; ++i) { 16048fe3844cSJunchao Zhang const PetscDeviceType dtype = PetscDeviceTypeCast(i); 16058fe3844cSJunchao Zhang if (PetscDeviceInitialized(dtype)) { /* a non-host device was initialized */ 16068fe3844cSJunchao Zhang deviceInitialized = PETSC_TRUE; 16078fe3844cSJunchao Zhang break; 16088fe3844cSJunchao Zhang } 16098fe3844cSJunchao Zhang } 16108fe3844cSJunchao Zhang /* the last condition says petsc is configured with device but it is a pure CPU run, so don't print misleading warnings */ 16113ba16761SJacob Faibussowitsch if (use_gpu_aware_mpi || size == 1 || !deviceInitialized) PetscFunctionReturn(PETSC_SUCCESS); 16129566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n\n")); 16139566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n")); 16149566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 16159566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # WARNING!!! 
#\n")); 16169566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 16179566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # This code was compiled with GPU support and you've #\n")); 16189566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # created PETSc/GPU objects, but you intentionally #\n")); 16199566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # used -use_gpu_aware_mpi 0, requiring PETSc to copy #\n")); 16209566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # additional data between the GPU and CPU. To obtain #\n")); 16219566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # meaningful timing results on multi-rank runs, use #\n")); 16229566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # GPU-aware MPI instead. #\n")); 16239566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 16249566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n\n\n")); 16253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1626c2a741eeSJunchao Zhang #else 162710450e9eSJacob Faibussowitsch (void)comm; 162810450e9eSJacob Faibussowitsch (void)fd; 16293ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 1630c2a741eeSJunchao Zhang #endif 1631c2a741eeSJunchao Zhang } 1632c2a741eeSJunchao Zhang 1633d71ae5a4SJacob Faibussowitsch static PetscErrorCode PetscLogViewWarnGpuTime(MPI_Comm comm, FILE *fd) 1634d71ae5a4SJacob Faibussowitsch { 1635156b51fbSBarry Smith #if defined(PETSC_HAVE_DEVICE) 1636156b51fbSBarry Smith PetscFunctionBegin; 16373ba16761SJacob Faibussowitsch if (!PetscLogGpuTimeFlag || petsc_gflops == 0) PetscFunctionReturn(PETSC_SUCCESS); 1638156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, "\n\n")); 1639156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n")); 1640156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, 
fd, " # #\n")); 1641156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # WARNING!!! #\n")); 1642156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # #\n")); 1643156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # This code was run with -log_view_gpu_time #\n")); 1644156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # This provides accurate timing within the GPU kernels #\n")); 1645156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # but can slow down the entire computation by a #\n")); 1646156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # measurable amount. For fastest runs we recommend #\n")); 1647156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # not using this option. #\n")); 1648156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # #\n")); 1649156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n\n\n")); 16503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1651156b51fbSBarry Smith #else 165210450e9eSJacob Faibussowitsch (void)comm; 165310450e9eSJacob Faibussowitsch (void)fd; 16543ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 1655156b51fbSBarry Smith #endif 1656156b51fbSBarry Smith } 1657156b51fbSBarry Smith 165810450e9eSJacob Faibussowitsch static PetscErrorCode PetscLogView_Default(PetscViewer viewer) 1659d71ae5a4SJacob Faibussowitsch { 16605c6c1daeSBarry Smith FILE *fd; 16615c6c1daeSBarry Smith PetscLogDouble zero = 0.0; 16625c6c1daeSBarry Smith PetscStageLog stageLog; 16630298fd71SBarry Smith PetscStageInfo *stageInfo = NULL; 16640298fd71SBarry Smith PetscEventPerfInfo *eventInfo = NULL; 16655c6c1daeSBarry Smith PetscClassPerfInfo *classInfo; 16665c6c1daeSBarry Smith char arch[128], hostname[128], username[128], pname[PETSC_MAX_PATH_LEN], date[128]; 16675c6c1daeSBarry Smith const char *name; 16685c6c1daeSBarry Smith PetscLogDouble locTotalTime, TotalTime, TotalFlops; 16695c6c1daeSBarry Smith PetscLogDouble numMessages, 
messageLength, avgMessLen, numReductions; 16705c6c1daeSBarry Smith PetscLogDouble stageTime, flops, flopr, mem, mess, messLen, red; 16715c6c1daeSBarry Smith PetscLogDouble fracTime, fracFlops, fracMessages, fracLength, fracReductions, fracMess, fracMessLen, fracRed; 16725c6c1daeSBarry Smith PetscLogDouble fracStageTime, fracStageFlops, fracStageMess, fracStageMessLen, fracStageRed; 16735c6c1daeSBarry Smith PetscLogDouble min, max, tot, ratio, avg, x, y; 1674e3ed9ee7SBarry Smith PetscLogDouble minf, maxf, totf, ratf, mint, maxt, tott, ratt, ratC, totm, totml, totr, mal, malmax, emalmax; 1675d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 1676156b51fbSBarry Smith PetscLogEvent KSP_Solve, SNES_Solve, TS_Step, TAO_Solve; /* These need to be fixed to be some events registered with certain objects */ 1677958c4211Shannah_mairs PetscLogDouble cct, gct, csz, gsz, gmaxt, gflops, gflopr, fracgflops; 1678bec0b493Shannah_mairs #endif 1679217044c2SLisandro Dalcin PetscMPIInt minC, maxC; 16805c6c1daeSBarry Smith PetscMPIInt size, rank; 16815c6c1daeSBarry Smith PetscBool *localStageUsed, *stageUsed; 16825c6c1daeSBarry Smith PetscBool *localStageVisible, *stageVisible; 16835c6c1daeSBarry Smith int numStages, localNumEvents, numEvents; 168437b78d16SBarry Smith int stage, oclass; 16855c6c1daeSBarry Smith PetscLogEvent event; 16865c6c1daeSBarry Smith char version[256]; 16875c6c1daeSBarry Smith MPI_Comm comm; 1688156b51fbSBarry Smith #if defined(PETSC_HAVE_DEVICE) 1689156b51fbSBarry Smith PetscLogEvent eventid; 1690156b51fbSBarry Smith PetscInt64 nas = 0x7FF0000000000002; 1691156b51fbSBarry Smith #endif 16925c6c1daeSBarry Smith 16935c6c1daeSBarry Smith PetscFunctionBegin; 1694156b51fbSBarry Smith PetscCall(PetscFPTrapPush(PETSC_FP_TRAP_OFF)); 16959566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)viewer, &comm)); 16969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIGetPointer(viewer, &fd)); 16979566063dSJacob Faibussowitsch 
PetscCallMPI(MPI_Comm_size(comm, &size)); 16989566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &rank)); 16995c6c1daeSBarry Smith /* Get the total elapsed time */ 17003ba16761SJacob Faibussowitsch PetscCall(PetscTime(&locTotalTime)); 17019371c9d4SSatish Balay locTotalTime -= petsc_BaseTime; 17025c6c1daeSBarry Smith 1703faad7b01SPierre Jolivet PetscCall(PetscFPrintf(comm, fd, "****************************************************************************************************************************************************************\n")); 17049566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "*** WIDEN YOUR WINDOW TO 160 CHARACTERS. Use 'enscript -r -fCourier9' to print this document ***\n")); 17059566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "****************************************************************************************************************************************************************\n")); 1706faad7b01SPierre Jolivet PetscCall(PetscFPrintf(comm, fd, "\n------------------------------------------------------------------ PETSc Performance Summary: ------------------------------------------------------------------\n\n")); 17079566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnSync(comm, fd)); 17089566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnDebugging(comm, fd)); 17099566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnNoGpuAwareMpi(comm, fd)); 1710156b51fbSBarry Smith PetscCall(PetscLogViewWarnGpuTime(comm, fd)); 17119566063dSJacob Faibussowitsch PetscCall(PetscGetArchType(arch, sizeof(arch))); 17129566063dSJacob Faibussowitsch PetscCall(PetscGetHostName(hostname, sizeof(hostname))); 17139566063dSJacob Faibussowitsch PetscCall(PetscGetUserName(username, sizeof(username))); 17149566063dSJacob Faibussowitsch PetscCall(PetscGetProgramName(pname, sizeof(pname))); 17159566063dSJacob Faibussowitsch PetscCall(PetscGetDate(date, sizeof(date))); 17169566063dSJacob Faibussowitsch 
PetscCall(PetscGetVersion(version, sizeof(version))); 17175c6c1daeSBarry Smith if (size == 1) { 17189566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s on a %s named %s with %d processor, by %s %s\n", pname, arch, hostname, size, username, date)); 17195c6c1daeSBarry Smith } else { 17209566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s on a %s named %s with %d processors, by %s %s\n", pname, arch, hostname, size, username, date)); 17215c6c1daeSBarry Smith } 1722f90b075cSBarry Smith #if defined(PETSC_HAVE_OPENMP) 17239566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Using %" PetscInt_FMT " OpenMP threads\n", PetscNumOMPThreads)); 1724f90b075cSBarry Smith #endif 17259566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Using %s\n", version)); 17265c6c1daeSBarry Smith 17275c6c1daeSBarry Smith /* Must preserve reduction count before we go on */ 17285c6c1daeSBarry Smith red = petsc_allreduce_ct + petsc_gather_ct + petsc_scatter_ct; 17295c6c1daeSBarry Smith 17305c6c1daeSBarry Smith /* Calculate summary information */ 17319566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n Max Max/Min Avg Total\n")); 17325c6c1daeSBarry Smith /* Time */ 1733712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&locTotalTime, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1734712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&locTotalTime, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1735712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&locTotalTime, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1736217044c2SLisandro Dalcin avg = tot / ((PetscLogDouble)size); 17379371c9d4SSatish Balay if (min != 0.0) ratio = max / min; 17389371c9d4SSatish Balay else ratio = 0.0; 17399566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Time (sec): %5.3e %7.3f %5.3e\n", max, ratio, avg)); 17405c6c1daeSBarry Smith TotalTime = tot; 17415c6c1daeSBarry Smith /* Objects */ 17425c6c1daeSBarry Smith avg = (PetscLogDouble)petsc_numObjects; 
1743712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&avg, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1744712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&avg, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1745712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&avg, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1746217044c2SLisandro Dalcin avg = tot / ((PetscLogDouble)size); 17479371c9d4SSatish Balay if (min != 0.0) ratio = max / min; 17489371c9d4SSatish Balay else ratio = 0.0; 17499566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Objects: %5.3e %7.3f %5.3e\n", max, ratio, avg)); 17505c6c1daeSBarry Smith /* Flops */ 1751712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&petsc_TotalFlops, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1752712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&petsc_TotalFlops, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1753712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&petsc_TotalFlops, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1754217044c2SLisandro Dalcin avg = tot / ((PetscLogDouble)size); 17559371c9d4SSatish Balay if (min != 0.0) ratio = max / min; 17569371c9d4SSatish Balay else ratio = 0.0; 17579566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Flops: %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 17585c6c1daeSBarry Smith TotalFlops = tot; 17595c6c1daeSBarry Smith /* Flops/sec -- Must talk to Barry here */ 17609371c9d4SSatish Balay if (locTotalTime != 0.0) flops = petsc_TotalFlops / locTotalTime; 17619371c9d4SSatish Balay else flops = 0.0; 1762712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&flops, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1763712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&flops, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1764712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&flops, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1765217044c2SLisandro Dalcin avg = tot / ((PetscLogDouble)size); 17669371c9d4SSatish Balay if (min != 0.0) ratio = max / min; 
17679371c9d4SSatish Balay else ratio = 0.0; 17689566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Flops/sec: %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 17695c6c1daeSBarry Smith /* Memory */ 17709566063dSJacob Faibussowitsch PetscCall(PetscMallocGetMaximumUsage(&mem)); 17715c6c1daeSBarry Smith if (mem > 0.0) { 1772712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&mem, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1773712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&mem, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1774712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&mem, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1775217044c2SLisandro Dalcin avg = tot / ((PetscLogDouble)size); 17769371c9d4SSatish Balay if (min != 0.0) ratio = max / min; 17779371c9d4SSatish Balay else ratio = 0.0; 17789566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Memory (bytes): %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 17795c6c1daeSBarry Smith } 17805c6c1daeSBarry Smith /* Messages */ 17815c6c1daeSBarry Smith mess = 0.5 * (petsc_irecv_ct + petsc_isend_ct + petsc_recv_ct + petsc_send_ct); 1782712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&mess, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1783712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&mess, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1784712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&mess, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1785217044c2SLisandro Dalcin avg = tot / ((PetscLogDouble)size); 17869371c9d4SSatish Balay if (min != 0.0) ratio = max / min; 17879371c9d4SSatish Balay else ratio = 0.0; 17889566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "MPI Msg Count: %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 17895c6c1daeSBarry Smith numMessages = tot; 17905c6c1daeSBarry Smith /* Message Lengths */ 17915c6c1daeSBarry Smith mess = 0.5 * (petsc_irecv_len + petsc_isend_len + petsc_recv_len + petsc_send_len); 1792712fec58SPierre Jolivet 
PetscCall(MPIU_Allreduce(&mess, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1793712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&mess, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1794712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&mess, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17959371c9d4SSatish Balay if (numMessages != 0) avg = tot / numMessages; 17969371c9d4SSatish Balay else avg = 0.0; 17979371c9d4SSatish Balay if (min != 0.0) ratio = max / min; 17989371c9d4SSatish Balay else ratio = 0.0; 17999566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "MPI Msg Len (bytes): %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 18005c6c1daeSBarry Smith messageLength = tot; 18015c6c1daeSBarry Smith /* Reductions */ 1802712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&red, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1803712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&red, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1804712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&red, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18059371c9d4SSatish Balay if (min != 0.0) ratio = max / min; 18069371c9d4SSatish Balay else ratio = 0.0; 18079566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "MPI Reductions: %5.3e %7.3f\n", max, ratio)); 18085c6c1daeSBarry Smith numReductions = red; /* wrong because uses count from process zero */ 18099566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\nFlop counting convention: 1 flop = 1 real number operation of type (multiply/divide/add/subtract)\n")); 18109566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " e.g., VecAXPY() for real vectors of length N --> 2N flops\n")); 18119566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " and VecAXPY() for complex vectors of length N --> 8N flops\n")); 18125c6c1daeSBarry Smith 18135c6c1daeSBarry Smith /* Get total number of stages -- 18145c6c1daeSBarry Smith Currently, a single processor can register more stages than another, but 
stages must all be registered in order. 18155c6c1daeSBarry Smith We can removed this requirement if necessary by having a global stage numbering and indirection on the stage ID. 18165c6c1daeSBarry Smith This seems best accomplished by assoicating a communicator with each stage. 18175c6c1daeSBarry Smith */ 18189566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 18199566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->numStages, &numStages, 1, MPI_INT, MPI_MAX, comm)); 18209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numStages, &localStageUsed)); 18219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numStages, &stageUsed)); 18229566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numStages, &localStageVisible)); 18239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numStages, &stageVisible)); 18245c6c1daeSBarry Smith if (numStages > 0) { 18255c6c1daeSBarry Smith stageInfo = stageLog->stageInfo; 18265c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 18275c6c1daeSBarry Smith if (stage < stageLog->numStages) { 18285c6c1daeSBarry Smith localStageUsed[stage] = stageInfo[stage].used; 18295c6c1daeSBarry Smith localStageVisible[stage] = stageInfo[stage].perfInfo.visible; 18305c6c1daeSBarry Smith } else { 18315c6c1daeSBarry Smith localStageUsed[stage] = PETSC_FALSE; 18325c6c1daeSBarry Smith localStageVisible[stage] = PETSC_TRUE; 18335c6c1daeSBarry Smith } 18345c6c1daeSBarry Smith } 1835712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(localStageUsed, stageUsed, numStages, MPIU_BOOL, MPI_LOR, comm)); 1836712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(localStageVisible, stageVisible, numStages, MPIU_BOOL, MPI_LAND, comm)); 18375c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 18385c6c1daeSBarry Smith if (stageUsed[stage]) { 18399566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\nSummary of Stages: ----- Time ------ ----- Flop ------ --- Messages --- -- Message Lengths -- -- 
Reductions --\n")); 18409566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Avg %%Total Avg %%Total Count %%Total Avg %%Total Count %%Total\n")); 18415c6c1daeSBarry Smith break; 18425c6c1daeSBarry Smith } 18435c6c1daeSBarry Smith } 18445c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 18455c6c1daeSBarry Smith if (!stageUsed[stage]) continue; 1846820f2d46SBarry Smith /* CANNOT use MPI_Allreduce() since it might fail the line number check */ 18475c6c1daeSBarry Smith if (localStageUsed[stage]) { 1848712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.time, &stageTime, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1849712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.flops, &flops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1850712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.numMessages, &mess, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1851712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.messageLength, &messLen, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1852712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.numReductions, &red, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18535c6c1daeSBarry Smith name = stageInfo[stage].name; 18545c6c1daeSBarry Smith } else { 1855712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &stageTime, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1856712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &flops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1857712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &mess, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1858712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &messLen, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1859712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &red, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18605c6c1daeSBarry Smith name = ""; 18615c6c1daeSBarry Smith } 18629371c9d4SSatish Balay mess *= 0.5; 18639371c9d4SSatish Balay 
messLen *= 0.5; 18649371c9d4SSatish Balay red /= size; 18659371c9d4SSatish Balay if (TotalTime != 0.0) fracTime = stageTime / TotalTime; 18669371c9d4SSatish Balay else fracTime = 0.0; 18679371c9d4SSatish Balay if (TotalFlops != 0.0) fracFlops = flops / TotalFlops; 18689371c9d4SSatish Balay else fracFlops = 0.0; 18695c6c1daeSBarry Smith /* Talk to Barry if (stageTime != 0.0) flops = (size*flops)/stageTime; else flops = 0.0; */ 18709371c9d4SSatish Balay if (numMessages != 0.0) fracMessages = mess / numMessages; 18719371c9d4SSatish Balay else fracMessages = 0.0; 18729371c9d4SSatish Balay if (mess != 0.0) avgMessLen = messLen / mess; 18739371c9d4SSatish Balay else avgMessLen = 0.0; 18749371c9d4SSatish Balay if (messageLength != 0.0) fracLength = messLen / messageLength; 18759371c9d4SSatish Balay else fracLength = 0.0; 18769371c9d4SSatish Balay if (numReductions != 0.0) fracReductions = red / numReductions; 18779371c9d4SSatish Balay else fracReductions = 0.0; 18789371c9d4SSatish Balay PetscCall(PetscFPrintf(comm, fd, "%2d: %15s: %6.4e %5.1f%% %6.4e %5.1f%% %5.3e %5.1f%% %5.3e %5.1f%% %5.3e %5.1f%%\n", stage, name, stageTime / size, 100.0 * fracTime, flops, 100.0 * fracFlops, mess, 100.0 * fracMessages, avgMessLen, 100.0 * fracLength, red, 100.0 * fracReductions)); 18795c6c1daeSBarry Smith } 18805c6c1daeSBarry Smith } 18815c6c1daeSBarry Smith 18829566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n------------------------------------------------------------------------------------------------------------------------\n")); 18839566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "See the 'Profiling' chapter of the users' manual for details on interpreting output.\n")); 18849566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Phase summary info:\n")); 18859566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Count: number of times phase was executed\n")); 18869566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Time 
and Flop: Max - maximum over all processors\n")); 18879566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Ratio - ratio of maximum to minimum over all processors\n")); 18889566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Mess: number of messages sent\n")); 18899566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " AvgLen: average message length (bytes)\n")); 18909566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Reduct: number of global reductions\n")); 18919566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Global: entire computation\n")); 18929566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Stage: stages of a computation. Set stages with PetscLogStagePush() and PetscLogStagePop().\n")); 18939566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " %%T - percent time in this phase %%F - percent flop in this phase\n")); 18949566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " %%M - percent messages in this phase %%L - percent message lengths in this phase\n")); 18959566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " %%R - percent reductions in this phase\n")); 18969566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Total Mflop/s: 10e-6 * (sum of flop over all processors)/(max time over all processors)\n")); 1897e3ed9ee7SBarry Smith if (PetscLogMemory) { 189892d1ba04SBarry Smith PetscCall(PetscFPrintf(comm, fd, " Memory usage is summed over all MPI processes, it is given in mega-bytes\n")); 189954aabf2dSBarry Smith PetscCall(PetscFPrintf(comm, fd, " Malloc Mbytes: Memory allocated and kept during event (sum over all calls to event). May be negative\n")); 190054aabf2dSBarry Smith PetscCall(PetscFPrintf(comm, fd, " EMalloc Mbytes: extra memory allocated during event and then freed (maximum over all calls to events). 
Never negative\n")); 190154aabf2dSBarry Smith PetscCall(PetscFPrintf(comm, fd, " MMalloc Mbytes: Increase in high water mark of allocated memory (sum over all calls to event). Never negative\n")); 19029566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " RMI Mbytes: Increase in resident memory (sum over all calls to event)\n")); 1903e3ed9ee7SBarry Smith } 1904d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 19059566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GPU Mflop/s: 10e-6 * (sum of flop on GPU over all processors)/(max GPU time over all processors)\n")); 19069566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " CpuToGpu Count: total number of CPU to GPU copies per processor\n")); 19079566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " CpuToGpu Size (Mbytes): 10e-6 * (total size of CPU to GPU copies per processor)\n")); 19089566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GpuToCpu Count: total number of GPU to CPU copies per processor\n")); 19099566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GpuToCpu Size (Mbytes): 10e-6 * (total size of GPU to CPU copies per processor)\n")); 19109566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GPU %%F: percent flops on GPU in this event\n")); 1911bec0b493Shannah_mairs #endif 19129566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "------------------------------------------------------------------------------------------------------------------------\n")); 19135c6c1daeSBarry Smith 19149566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnDebugging(comm, fd)); 19155c6c1daeSBarry Smith 19165c6c1daeSBarry Smith /* Report events */ 19179566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Event Count Time (sec) Flop --- Global --- --- Stage ---- Total")); 191848a46eb9SPierre Jolivet if (PetscLogMemory) PetscCall(PetscFPrintf(comm, fd, " Malloc EMalloc MMalloc RMI")); 1919d9c66bfbSJunchao Zhang #if 
defined(PETSC_HAVE_DEVICE) 19209566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GPU - CpuToGpu - - GpuToCpu - GPU")); 1921bec0b493Shannah_mairs #endif 19229566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 19239566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Max Ratio Max Ratio Max Ratio Mess AvgLen Reduct %%T %%F %%M %%L %%R %%T %%F %%M %%L %%R Mflop/s")); 192448a46eb9SPierre Jolivet if (PetscLogMemory) PetscCall(PetscFPrintf(comm, fd, " Mbytes Mbytes Mbytes Mbytes")); 1925d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 19269566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Mflop/s Count Size Count Size %%F")); 1927bec0b493Shannah_mairs #endif 19289566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 19299566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "------------------------------------------------------------------------------------------------------------------------")); 193048a46eb9SPierre Jolivet if (PetscLogMemory) PetscCall(PetscFPrintf(comm, fd, "-----------------------------")); 1931d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 19329566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "---------------------------------------")); 19334863603aSSatish Balay #endif 19349566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 19355c6c1daeSBarry Smith 1936156b51fbSBarry Smith #if defined(PETSC_HAVE_DEVICE) 1937156b51fbSBarry Smith /* this indirect way of accessing these values is needed when PETSc is build with multiple libraries since the symbols are not in libpetscsys */ 1938156b51fbSBarry Smith PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, "TAOSolve", &TAO_Solve)); 1939156b51fbSBarry Smith PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, "TSStep", &TS_Step)); 1940156b51fbSBarry Smith PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, "SNESSolve", &SNES_Solve)); 1941156b51fbSBarry Smith 
PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, "KSPSolve", &KSP_Solve)); 1942156b51fbSBarry Smith #endif 1943156b51fbSBarry Smith 19445c6c1daeSBarry Smith /* Problem: The stage name will not show up unless the stage executed on proc 1 */ 19455c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 19465c6c1daeSBarry Smith if (!stageVisible[stage]) continue; 1947820f2d46SBarry Smith /* CANNOT use MPI_Allreduce() since it might fail the line number check */ 19485c6c1daeSBarry Smith if (localStageUsed[stage]) { 19499566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n--- Event Stage %d: %s\n\n", stage, stageInfo[stage].name)); 1950712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.time, &stageTime, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1951712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.flops, &flops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1952712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.numMessages, &mess, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1953712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.messageLength, &messLen, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1954712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&stageInfo[stage].perfInfo.numReductions, &red, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 19555c6c1daeSBarry Smith } else { 19569566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n--- Event Stage %d: Unknown\n\n", stage)); 1957712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &stageTime, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1958712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &flops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1959712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &mess, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1960712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &messLen, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1961712fec58SPierre Jolivet 
PetscCall(MPIU_Allreduce(&zero, &red, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 19625c6c1daeSBarry Smith } 19639371c9d4SSatish Balay mess *= 0.5; 19649371c9d4SSatish Balay messLen *= 0.5; 19659371c9d4SSatish Balay red /= size; 19665c6c1daeSBarry Smith 19675c6c1daeSBarry Smith /* Get total number of events in this stage -- 19685c6c1daeSBarry Smith Currently, a single processor can register more events than another, but events must all be registered in order, 19695c6c1daeSBarry Smith just like stages. We can removed this requirement if necessary by having a global event numbering and indirection 1970217044c2SLisandro Dalcin on the event ID. This seems best accomplished by associating a communicator with each stage. 19715c6c1daeSBarry Smith 19725c6c1daeSBarry Smith Problem: If the event did not happen on proc 1, its name will not be available. 19735c6c1daeSBarry Smith Problem: Event visibility is not implemented 19745c6c1daeSBarry Smith */ 19755c6c1daeSBarry Smith if (localStageUsed[stage]) { 19765c6c1daeSBarry Smith eventInfo = stageLog->stageInfo[stage].eventLog->eventInfo; 19775c6c1daeSBarry Smith localNumEvents = stageLog->stageInfo[stage].eventLog->numEvents; 1978a297a907SKarl Rupp } else localNumEvents = 0; 19799566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&localNumEvents, &numEvents, 1, MPI_INT, MPI_MAX, comm)); 19805c6c1daeSBarry Smith for (event = 0; event < numEvents; event++) { 1981820f2d46SBarry Smith /* CANNOT use MPI_Allreduce() since it might fail the line number check */ 19825c6c1daeSBarry Smith if (localStageUsed[stage] && (event < stageLog->stageInfo[stage].eventLog->numEvents) && (eventInfo[event].depth == 0)) { 19839371c9d4SSatish Balay if ((eventInfo[event].count > 0) && (eventInfo[event].time > 0.0)) flopr = eventInfo[event].flops; 19849371c9d4SSatish Balay else flopr = 0.0; 1985712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&flopr, &minf, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1986712fec58SPierre Jolivet 
PetscCall(MPIU_Allreduce(&flopr, &maxf, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1987712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].flops, &totf, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1988712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].time, &mint, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 1989712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].time, &maxt, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1990712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].time, &tott, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1991712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].numMessages, &totm, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1992712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].messageLength, &totml, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1993712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].numReductions, &totr, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 19949566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].count, &minC, 1, MPI_INT, MPI_MIN, comm)); 19959566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].count, &maxC, 1, MPI_INT, MPI_MAX, comm)); 1996e3ed9ee7SBarry Smith if (PetscLogMemory) { 1997712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].memIncrease, &mem, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1998712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].mallocSpace, &mal, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1999712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].mallocIncrease, &malmax, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2000712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].mallocIncreaseEvent, &emalmax, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2001e3ed9ee7SBarry Smith } 2002d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 2003712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].CpuToGpuCount, &cct, 1, 
MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2004712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].GpuToCpuCount, &gct, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2005712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].CpuToGpuSize, &csz, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2006712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].GpuToCpuSize, &gsz, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2007712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].GpuFlops, &gflops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2008712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&eventInfo[event].GpuTime, &gmaxt, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 2009bec0b493Shannah_mairs #endif 20105c6c1daeSBarry Smith name = stageLog->eventLog->eventInfo[event].name; 20115c6c1daeSBarry Smith } else { 20123ba16761SJacob Faibussowitsch int ierr = 0; 20133ba16761SJacob Faibussowitsch 20145c6c1daeSBarry Smith flopr = 0.0; 2015712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&flopr, &minf, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 2016712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&flopr, &maxf, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 2017712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &totf, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2018712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &mint, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 2019712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &maxt, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 2020712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &tott, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2021712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &totm, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2022712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &totml, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2023712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &totr, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 20249566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&ierr, 
&minC, 1, MPI_INT, MPI_MIN, comm)); 20259566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&ierr, &maxC, 1, MPI_INT, MPI_MAX, comm)); 2026e3ed9ee7SBarry Smith if (PetscLogMemory) { 2027712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &mem, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2028712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &mal, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2029712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &malmax, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2030712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &emalmax, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2031e3ed9ee7SBarry Smith } 2032d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 2033712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &cct, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2034712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &gct, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2035712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &csz, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2036712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &gsz, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2037712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &gflops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 2038712fec58SPierre Jolivet PetscCall(MPIU_Allreduce(&zero, &gmaxt, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 2039bec0b493Shannah_mairs #endif 20405c6c1daeSBarry Smith name = ""; 20415c6c1daeSBarry Smith } 20425c6c1daeSBarry Smith if (mint < 0.0) { 2043d0609cedSBarry Smith PetscCall(PetscFPrintf(comm, fd, "WARNING!!! Minimum time %g over all processors for %s is negative! This happens\n on some machines whose times cannot handle too rapid calls.!\n artificially changing minimum to zero.\n", mint, name)); 20445c6c1daeSBarry Smith mint = 0; 20455c6c1daeSBarry Smith } 204608401ef6SPierre Jolivet PetscCheck(minf >= 0.0, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Minimum flop %g over all processors for %s is negative! 
Not possible!", minf, name); 2047156b51fbSBarry Smith /* Put NaN into the time for all events that may not be time accurately since they may happen asynchronously on the GPU */ 2048156b51fbSBarry Smith #if defined(PETSC_HAVE_DEVICE) 2049156b51fbSBarry Smith if (!PetscLogGpuTimeFlag && petsc_gflops > 0) { 2050156b51fbSBarry Smith memcpy(&gmaxt, &nas, sizeof(PetscLogDouble)); 2051156b51fbSBarry Smith PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, name, &eventid)); 2052156b51fbSBarry Smith if (eventid != SNES_Solve && eventid != KSP_Solve && eventid != TS_Step && eventid != TAO_Solve) { 2053156b51fbSBarry Smith memcpy(&mint, &nas, sizeof(PetscLogDouble)); 2054156b51fbSBarry Smith memcpy(&maxt, &nas, sizeof(PetscLogDouble)); 2055156b51fbSBarry Smith } 2056156b51fbSBarry Smith } 2057156b51fbSBarry Smith #endif 20589371c9d4SSatish Balay totm *= 0.5; 20599371c9d4SSatish Balay totml *= 0.5; 20609371c9d4SSatish Balay totr /= size; 20615c6c1daeSBarry Smith 2062217044c2SLisandro Dalcin if (maxC != 0) { 20639371c9d4SSatish Balay if (minC != 0) ratC = ((PetscLogDouble)maxC) / minC; 20649371c9d4SSatish Balay else ratC = 0.0; 20659371c9d4SSatish Balay if (mint != 0.0) ratt = maxt / mint; 20669371c9d4SSatish Balay else ratt = 0.0; 20679371c9d4SSatish Balay if (minf != 0.0) ratf = maxf / minf; 20689371c9d4SSatish Balay else ratf = 0.0; 20699371c9d4SSatish Balay if (TotalTime != 0.0) fracTime = tott / TotalTime; 20709371c9d4SSatish Balay else fracTime = 0.0; 20719371c9d4SSatish Balay if (TotalFlops != 0.0) fracFlops = totf / TotalFlops; 20729371c9d4SSatish Balay else fracFlops = 0.0; 20739371c9d4SSatish Balay if (stageTime != 0.0) fracStageTime = tott / stageTime; 20749371c9d4SSatish Balay else fracStageTime = 0.0; 20759371c9d4SSatish Balay if (flops != 0.0) fracStageFlops = totf / flops; 20769371c9d4SSatish Balay else fracStageFlops = 0.0; 20779371c9d4SSatish Balay if (numMessages != 0.0) fracMess = totm / numMessages; 20789371c9d4SSatish Balay else fracMess = 0.0; 
20799371c9d4SSatish Balay if (messageLength != 0.0) fracMessLen = totml / messageLength; 20809371c9d4SSatish Balay else fracMessLen = 0.0; 20819371c9d4SSatish Balay if (numReductions != 0.0) fracRed = totr / numReductions; 20829371c9d4SSatish Balay else fracRed = 0.0; 20839371c9d4SSatish Balay if (mess != 0.0) fracStageMess = totm / mess; 20849371c9d4SSatish Balay else fracStageMess = 0.0; 20859371c9d4SSatish Balay if (messLen != 0.0) fracStageMessLen = totml / messLen; 20869371c9d4SSatish Balay else fracStageMessLen = 0.0; 20879371c9d4SSatish Balay if (red != 0.0) fracStageRed = totr / red; 20889371c9d4SSatish Balay else fracStageRed = 0.0; 20899371c9d4SSatish Balay if (totm != 0.0) totml /= totm; 20909371c9d4SSatish Balay else totml = 0.0; 20919371c9d4SSatish Balay if (maxt != 0.0) flopr = totf / maxt; 20929371c9d4SSatish Balay else flopr = 0.0; 209368a21331SBarry Smith if (fracStageTime > 1.0 || fracStageFlops > 1.0 || fracStageMess > 1.0 || fracStageMessLen > 1.0 || fracStageRed > 1.0) 2094a76edefcSRicardo Jesus PetscCall(PetscFPrintf(comm, fd, "%-16s %7d %3.1f %5.4e %3.1f %3.2e %3.1f %2.1e %2.1e %2.1e %2.0f %2.0f %2.0f %2.0f %2.0f Multiple stages %5.0f", name, maxC, ratC, maxt, ratt, maxf, ratf, totm, totml, totr, 100.0 * fracTime, 100.0 * fracFlops, 100.0 * fracMess, 100.0 * fracMessLen, 100.0 * fracRed, PetscAbs(flopr) / 1.0e6)); 209568a21331SBarry Smith else 2096a76edefcSRicardo Jesus PetscCall(PetscFPrintf(comm, fd, "%-16s %7d %3.1f %5.4e %3.1f %3.2e %3.1f %2.1e %2.1e %2.1e %2.0f %2.0f %2.0f %2.0f %2.0f %3.0f %2.0f %2.0f %2.0f %2.0f %5.0f", name, maxC, ratC, maxt, ratt, maxf, ratf, totm, totml, totr, 100.0 * fracTime, 100.0 * fracFlops, 100.0 * fracMess, 100.0 * fracMessLen, 100.0 * fracRed, 100.0 * fracStageTime, 100.0 * fracStageFlops, 100.0 * fracStageMess, 100.0 * fracStageMessLen, 100.0 * fracStageRed, PetscAbs(flopr) / 1.0e6)); 209748a46eb9SPierre Jolivet if (PetscLogMemory) PetscCall(PetscFPrintf(comm, fd, " %5.0f %5.0f %5.0f %5.0f", mal / 1.0e6, 
emalmax / 1.0e6, malmax / 1.0e6, mem / 1.0e6)); 2098d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 20999371c9d4SSatish Balay if (totf != 0.0) fracgflops = gflops / totf; 21009371c9d4SSatish Balay else fracgflops = 0.0; 21019371c9d4SSatish Balay if (gmaxt != 0.0) gflopr = gflops / gmaxt; 21029371c9d4SSatish Balay else gflopr = 0.0; 2103a76edefcSRicardo Jesus PetscCall(PetscFPrintf(comm, fd, " %5.0f %4.0f %3.2e %4.0f %3.2e % 2.0f", PetscAbs(gflopr) / 1.0e6, cct / size, csz / (1.0e6 * size), gct / size, gsz / (1.0e6 * size), 100.0 * fracgflops)); 2104bec0b493Shannah_mairs #endif 21059566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 21065c6c1daeSBarry Smith } 21075c6c1daeSBarry Smith } 21085c6c1daeSBarry Smith } 21095c6c1daeSBarry Smith 21105c6c1daeSBarry Smith /* Memory usage and object creation */ 21119566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "------------------------------------------------------------------------------------------------------------------------")); 211248a46eb9SPierre Jolivet if (PetscLogMemory) PetscCall(PetscFPrintf(comm, fd, "-----------------------------")); 2113d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 21149566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "---------------------------------------")); 21154863603aSSatish Balay #endif 21169566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 21179566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 21185c6c1daeSBarry Smith 21195c6c1daeSBarry Smith /* Right now, only stages on the first processor are reported here, meaning only objects associated with 21205c6c1daeSBarry Smith the global communicator, or MPI_COMM_SELF for proc 1. We really should report global stats and then 21215c6c1daeSBarry Smith stats for stages local to processor sets. 
21225c6c1daeSBarry Smith */ 21235c6c1daeSBarry Smith /* We should figure out the longest object name here (now 20 characters) */ 21244851f57dSBarry Smith PetscCall(PetscFPrintf(comm, fd, "Object Type Creations Destructions. Reports information only for process 0.\n")); 21255c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 21265c6c1daeSBarry Smith if (localStageUsed[stage]) { 21275c6c1daeSBarry Smith classInfo = stageLog->stageInfo[stage].classLog->classInfo; 21289566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n--- Event Stage %d: %s\n\n", stage, stageInfo[stage].name)); 21295c6c1daeSBarry Smith for (oclass = 0; oclass < stageLog->stageInfo[stage].classLog->numClasses; oclass++) { 21305c6c1daeSBarry Smith if ((classInfo[oclass].creations > 0) || (classInfo[oclass].destructions > 0)) { 21314851f57dSBarry Smith PetscCall(PetscFPrintf(comm, fd, "%20s %5d %5d\n", stageLog->classLog->classInfo[oclass].name, classInfo[oclass].creations, classInfo[oclass].destructions)); 21325c6c1daeSBarry Smith } 21335c6c1daeSBarry Smith } 21345c6c1daeSBarry Smith } else { 2135cf019ec6SStefano Zampini if (!localStageVisible[stage]) continue; 21369566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n--- Event Stage %d: Unknown\n\n", stage)); 21375c6c1daeSBarry Smith } 21385c6c1daeSBarry Smith } 21395c6c1daeSBarry Smith 21409566063dSJacob Faibussowitsch PetscCall(PetscFree(localStageUsed)); 21419566063dSJacob Faibussowitsch PetscCall(PetscFree(stageUsed)); 21429566063dSJacob Faibussowitsch PetscCall(PetscFree(localStageVisible)); 21439566063dSJacob Faibussowitsch PetscCall(PetscFree(stageVisible)); 21445c6c1daeSBarry Smith 21455c6c1daeSBarry Smith /* Information unrelated to this particular run */ 21469566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "========================================================================================================================\n")); 21473ba16761SJacob Faibussowitsch 
PetscCall(PetscTime(&y)); 21483ba16761SJacob Faibussowitsch PetscCall(PetscTime(&x)); 21493ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21503ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21513ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21523ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21533ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21543ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21553ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21563ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21573ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21583ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21599566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Average time to get PetscTime(): %g\n", (y - x) / 10.0)); 21605c6c1daeSBarry Smith /* MPI information */ 21615c6c1daeSBarry Smith if (size > 1) { 21625c6c1daeSBarry Smith MPI_Status status; 21635c6c1daeSBarry Smith PetscMPIInt tag; 21645c6c1daeSBarry Smith MPI_Comm newcomm; 21655c6c1daeSBarry Smith 21669566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 21673ba16761SJacob Faibussowitsch PetscCall(PetscTime(&x)); 21689566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 21699566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 21709566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 21719566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 21729566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 21733ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21749566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Average time for MPI_Barrier(): %g\n", (y - x) / 5.0)); 21759566063dSJacob Faibussowitsch PetscCall(PetscCommDuplicate(comm, &newcomm, &tag)); 21769566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 21775c6c1daeSBarry Smith if (rank) { 21789566063dSJacob Faibussowitsch PetscCallMPI(MPI_Recv(NULL, 0, MPI_INT, rank - 1, tag, newcomm, &status)); 
21799566063dSJacob Faibussowitsch PetscCallMPI(MPI_Send(NULL, 0, MPI_INT, (rank + 1) % size, tag, newcomm)); 21805c6c1daeSBarry Smith } else { 21813ba16761SJacob Faibussowitsch PetscCall(PetscTime(&x)); 21829566063dSJacob Faibussowitsch PetscCallMPI(MPI_Send(NULL, 0, MPI_INT, 1, tag, newcomm)); 21839566063dSJacob Faibussowitsch PetscCallMPI(MPI_Recv(NULL, 0, MPI_INT, size - 1, tag, newcomm, &status)); 21843ba16761SJacob Faibussowitsch PetscCall(PetscTime(&y)); 21859566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Average time for zero size MPI_Send(): %g\n", (y - x) / size)); 21865c6c1daeSBarry Smith } 21879566063dSJacob Faibussowitsch PetscCall(PetscCommDestroy(&newcomm)); 21885c6c1daeSBarry Smith } 21899566063dSJacob Faibussowitsch PetscCall(PetscOptionsView(NULL, viewer)); 21905c6c1daeSBarry Smith 21915c6c1daeSBarry Smith /* Machine and compile information */ 21925c6c1daeSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNELS) 21939566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with FORTRAN kernels\n")); 21945c6c1daeSBarry Smith #else 21959566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled without FORTRAN kernels\n")); 21965c6c1daeSBarry Smith #endif 2197217044c2SLisandro Dalcin #if defined(PETSC_USE_64BIT_INDICES) 21987de69702SBarry Smith PetscCall(PetscFPrintf(comm, fd, "Compiled with 64-bit PetscInt\n")); 2199217044c2SLisandro Dalcin #elif defined(PETSC_USE___FLOAT128) 22007de69702SBarry Smith PetscCall(PetscFPrintf(comm, fd, "Compiled with 32-bit PetscInt\n")); 2201217044c2SLisandro Dalcin #endif 22025c6c1daeSBarry Smith #if defined(PETSC_USE_REAL_SINGLE) 22039566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with single precision PetscScalar and PetscReal\n")); 22045f27b2e0SBarry Smith #elif defined(PETSC_USE___FLOAT128) 22059566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with 128 bit precision PetscScalar and PetscReal\n")); 22065c6c1daeSBarry Smith #endif 
22075c6c1daeSBarry Smith #if defined(PETSC_USE_REAL_MAT_SINGLE) 22089566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with single precision matrices\n")); 22095c6c1daeSBarry Smith #else 22109566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with full precision matrices (default)\n")); 22115c6c1daeSBarry Smith #endif 22129371c9d4SSatish Balay PetscCall(PetscFPrintf(comm, fd, "sizeof(short) %d sizeof(int) %d sizeof(long) %d sizeof(void*) %d sizeof(PetscScalar) %d sizeof(PetscInt) %d\n", (int)sizeof(short), (int)sizeof(int), (int)sizeof(long), (int)sizeof(void *), (int)sizeof(PetscScalar), (int)sizeof(PetscInt))); 22135c6c1daeSBarry Smith 22149566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Configure options: %s", petscconfigureoptions)); 22159566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s", petscmachineinfo)); 22169566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s", petsccompilerinfo)); 22179566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s", petsccompilerflagsinfo)); 22189566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s", petsclinkerinfo)); 22195c6c1daeSBarry Smith 22205c6c1daeSBarry Smith /* Cleanup */ 22219566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 22229566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnNoGpuAwareMpi(comm, fd)); 22239566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnDebugging(comm, fd)); 2224156b51fbSBarry Smith PetscCall(PetscFPTrapPop()); 22253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22265c6c1daeSBarry Smith } 22275c6c1daeSBarry Smith 22287d6c928cSSatish Balay /*@C 22297d6c928cSSatish Balay PetscLogView - Prints a summary of the logging. 22305c6c1daeSBarry Smith 22315c6c1daeSBarry Smith Collective over MPI_Comm 22325c6c1daeSBarry Smith 22335c6c1daeSBarry Smith Input Parameter: 2234f14045dbSBarry Smith . 
viewer - an ASCII viewer

  Options Database Keys:
+ -log_view [:filename] - Prints summary of log information
. -log_view :filename.py:ascii_info_detail - Saves logging information from each process as a Python file
. -log_view :filename.csv:ascii_csv - Saves logging information in a comma-separated values (CSV) format
. -log_view :filename.xml:ascii_xml - Saves a summary of the logging information in a nested format (see below for how to view it)
. -log_view :filename.txt:ascii_flamegraph - Saves logging information in a format suitable for visualising as a Flame Graph (see below for how to view it)
. -log_view_memory - Also display memory usage in each event
. -log_view_gpu_time - Also display time in each event for GPU kernels (Note this may slow the computation)
. -log_all - Saves a file Log.rank for each MPI rank with details of each step of the computation
- -log_trace [filename] - Displays a trace of what each process is doing

  Level: beginner

  Notes:
  It is possible to control the logging programmatically but we recommend using the options database approach whenever possible.
  By default the summary is printed to stdout.

  Before calling this routine you must have called either `PetscLogDefaultBegin()` or `PetscLogNestedBegin()`.

  If PETSc is configured with --with-logging=0 then this functionality is not available.

  To view the nested XML format filename.xml first copy ${PETSC_DIR}/share/petsc/xml/performance_xml2html.xsl to the current
  directory then open filename.xml with your browser. Specific notes for certain browsers\:
$ Firefox and Internet Explorer - simply open the file
$ Google Chrome - you must start up Chrome with the option --allow-file-access-from-files
$ Safari - see https://ccm.net/faq/36342-safari-how-to-enable-local-file-access
  or one can use the package http://xmlsoft.org/XSLT/xsltproc2.html to translate the xml file to html and then open it with
  your browser.
  Alternatively, use the script ${PETSC_DIR}/lib/petsc/bin/petsc-performance-view to automatically open a new browser
  window and render the XML log file contents.

  The nested XML format was kindly donated by Koos Huijssen and Christiaan M. Klaij of the Maritime Research Institute Netherlands.

  The Flame Graph output can be visualised using either the original Flame Graph script (https://github.com/brendangregg/FlameGraph)
  or using speedscope (https://www.speedscope.app).
  Old XML profiles may be converted into this format using the script ${PETSC_DIR}/lib/petsc/bin/xml2flamegraph.py.
2271d0a29bd7SConnor Ward 2272d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDefaultBegin()`, `PetscLogDump()` 22735c6c1daeSBarry Smith @*/ 2274d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogView(PetscViewer viewer) 2275d71ae5a4SJacob Faibussowitsch { 2276f14045dbSBarry Smith PetscBool isascii; 2277f14045dbSBarry Smith PetscViewerFormat format; 227837b78d16SBarry Smith int stage, lastStage; 227937b78d16SBarry Smith PetscStageLog stageLog; 22805c6c1daeSBarry Smith 22815c6c1daeSBarry Smith PetscFunctionBegin; 228228b400f6SJacob Faibussowitsch PetscCheck(PetscLogPLB, PETSC_COMM_SELF, PETSC_ERR_SUP, "Must use -log_view or PetscLogDefaultBegin() before calling this routine"); 228337b78d16SBarry Smith /* Pop off any stages the user forgot to remove */ 228437b78d16SBarry Smith lastStage = 0; 22859566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 22869566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 228737b78d16SBarry Smith while (stage >= 0) { 228837b78d16SBarry Smith lastStage = stage; 22899566063dSJacob Faibussowitsch PetscCall(PetscStageLogPop(stageLog)); 22909566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 229137b78d16SBarry Smith } 22929566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &isascii)); 229328b400f6SJacob Faibussowitsch PetscCheck(isascii, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Currently can only view logging to ASCII"); 22949566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 2295f14045dbSBarry Smith if (format == PETSC_VIEWER_DEFAULT || format == PETSC_VIEWER_ASCII_INFO) { 22969566063dSJacob Faibussowitsch PetscCall(PetscLogView_Default(viewer)); 2297f14045dbSBarry Smith } else if (format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 22989566063dSJacob Faibussowitsch PetscCall(PetscLogView_Detailed(viewer)); 229938144912Sdeepblu2718 } else if (format == 
PETSC_VIEWER_ASCII_CSV) { 23009566063dSJacob Faibussowitsch PetscCall(PetscLogView_CSV(viewer)); 2301bb1d7374SBarry Smith } else if (format == PETSC_VIEWER_ASCII_XML) { 23029566063dSJacob Faibussowitsch PetscCall(PetscLogView_Nested(viewer)); 2303d0a29bd7SConnor Ward } else if (format == PETSC_VIEWER_ASCII_FLAMEGRAPH) { 23049566063dSJacob Faibussowitsch PetscCall(PetscLogView_Flamegraph(viewer)); 23055c6c1daeSBarry Smith } 23069566063dSJacob Faibussowitsch PetscCall(PetscStageLogPush(stageLog, lastStage)); 23073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23085c6c1daeSBarry Smith } 23095c6c1daeSBarry Smith 2310f14045dbSBarry Smith /*@C 2311811af0c4SBarry Smith PetscLogViewFromOptions - Processes command line options to determine if/how a `PetscLog` is to be viewed. 2312f14045dbSBarry Smith 2313811af0c4SBarry Smith Collective on `PETSC_COMM_WORLD` 2314f14045dbSBarry Smith 2315811af0c4SBarry Smith Level: developer 2316f14045dbSBarry Smith 2317d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogView()` 2318f14045dbSBarry Smith @*/ 2319d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogViewFromOptions(void) 2320d71ae5a4SJacob Faibussowitsch { 2321f14045dbSBarry Smith PetscViewer viewer; 2322f14045dbSBarry Smith PetscBool flg; 2323f14045dbSBarry Smith PetscViewerFormat format; 2324f14045dbSBarry Smith 2325f14045dbSBarry Smith PetscFunctionBegin; 23269566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetViewer(PETSC_COMM_WORLD, NULL, NULL, "-log_view", &viewer, &format, &flg)); 2327f14045dbSBarry Smith if (flg) { 23289566063dSJacob Faibussowitsch PetscCall(PetscViewerPushFormat(viewer, format)); 23299566063dSJacob Faibussowitsch PetscCall(PetscLogView(viewer)); 23309566063dSJacob Faibussowitsch PetscCall(PetscViewerPopFormat(viewer)); 23319566063dSJacob Faibussowitsch PetscCall(PetscViewerDestroy(&viewer)); 2332f14045dbSBarry Smith } 23333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2334f14045dbSBarry Smith } 
2335f14045dbSBarry Smith 23365c6c1daeSBarry Smith /*----------------------------------------------- Counter Functions -------------------------------------------------*/ 23375c6c1daeSBarry Smith /*@C 23385c6c1daeSBarry Smith PetscGetFlops - Returns the number of flops used on this processor 23395c6c1daeSBarry Smith since the program began. 23405c6c1daeSBarry Smith 23415c6c1daeSBarry Smith Not Collective 23425c6c1daeSBarry Smith 23435c6c1daeSBarry Smith Output Parameter: 234410450e9eSJacob Faibussowitsch . flops - number of floating point operations 23455c6c1daeSBarry Smith 2346d1f92df0SBarry Smith Level: intermediate 2347d1f92df0SBarry Smith 23485c6c1daeSBarry Smith Notes: 23495c6c1daeSBarry Smith A global counter logs all PETSc flop counts. The user can use 2350811af0c4SBarry Smith `PetscLogFlops()` to increment this counter to include flops for the 23515c6c1daeSBarry Smith application code. 23525c6c1daeSBarry Smith 2353811af0c4SBarry Smith A separate counter `PetscLogGPUFlops()` logs the flops that occur on any GPU associated with this MPI rank 2354811af0c4SBarry Smith 2355d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogGPUFlops()`, `PetscTime()`, `PetscLogFlops()` 23565c6c1daeSBarry Smith @*/ 2357d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscGetFlops(PetscLogDouble *flops) 2358d71ae5a4SJacob Faibussowitsch { 23595c6c1daeSBarry Smith PetscFunctionBegin; 23605c6c1daeSBarry Smith *flops = petsc_TotalFlops; 23613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23625c6c1daeSBarry Smith } 23635c6c1daeSBarry Smith 2364*1c1ad86eSToby Isaac /*@C 2365*1c1ad86eSToby Isaac PetscLogObjectState - Record information about an object with the default log handler 2366*1c1ad86eSToby Isaac 2367*1c1ad86eSToby Isaac Not Collective 2368*1c1ad86eSToby Isaac 2369*1c1ad86eSToby Isaac Input Parameters: 2370*1c1ad86eSToby Isaac + obj - the `PetscObject` 2371*1c1ad86eSToby Isaac . format - a printf-style format string 2372*1c1ad86eSToby Isaac - ... 
- printf arguments to format 2373*1c1ad86eSToby Isaac 2374*1c1ad86eSToby Isaac Level: developer 2375*1c1ad86eSToby Isaac 2376*1c1ad86eSToby Isaac .seealso: [](ch_profiling), `PetscLogObjectCreate()`, `PetscLogObjectDestroy()` 2377*1c1ad86eSToby Isaac @*/ 2378d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogObjectState(PetscObject obj, const char format[], ...) 2379d71ae5a4SJacob Faibussowitsch { 23805c6c1daeSBarry Smith size_t fullLength; 23815c6c1daeSBarry Smith va_list Argp; 23825c6c1daeSBarry Smith 23835c6c1daeSBarry Smith PetscFunctionBegin; 23843ba16761SJacob Faibussowitsch if (!petsc_logObjects) PetscFunctionReturn(PETSC_SUCCESS); 23855c6c1daeSBarry Smith va_start(Argp, format); 23869566063dSJacob Faibussowitsch PetscCall(PetscVSNPrintf(petsc_objects[obj->id].info, 64, format, &fullLength, Argp)); 23875c6c1daeSBarry Smith va_end(Argp); 23883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23895c6c1daeSBarry Smith } 23905c6c1daeSBarry Smith 23915c6c1daeSBarry Smith /*MC 23925c6c1daeSBarry Smith PetscLogFlops - Adds floating point operations to the global counter. 23935c6c1daeSBarry Smith 23945c6c1daeSBarry Smith Synopsis: 2395aaa7dc30SBarry Smith #include <petsclog.h> 23965c6c1daeSBarry Smith PetscErrorCode PetscLogFlops(PetscLogDouble f) 23975c6c1daeSBarry Smith 23985c6c1daeSBarry Smith Not Collective 23995c6c1daeSBarry Smith 24005c6c1daeSBarry Smith Input Parameter: 24015c6c1daeSBarry Smith . 
f - flop counter

  Example Usage:
.vb
  PetscLogEvent USER_EVENT;

  PetscLogEventRegister("User event", 0, &USER_EVENT);
  PetscLogEventBegin(USER_EVENT, 0, 0, 0, 0);
  [code segment to monitor]
  PetscLogFlops(user_flops);
  PetscLogEventEnd(USER_EVENT, 0, 0, 0, 0);
.ve

  Level: intermediate

  Note:
  A global counter logs all PETSc flop counts. The user can use `PetscLogFlops()` to increment
  this counter to include flops for the application code.

.seealso: [](ch_profiling), `PetscLogGpuFlops()`, `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscGetFlops()`
M*/

/*MC
  PetscPreLoadBegin - Begin a segment of code that may be preloaded (run twice) to get accurate
  timings

  Synopsis:
  #include <petsclog.h>
  void PetscPreLoadBegin(PetscBool flag, char *name);

  Not Collective

  Input Parameters:
+ flag - `PETSC_TRUE` to run twice, `PETSC_FALSE` to run once, may be overridden with command
         line option `-preload true|false`
- name - name of first stage (lines of code timed separately with `-log_view`) to be preloaded

  Example Usage:
.vb
  PetscPreLoadBegin(PETSC_TRUE, "first stage");
  // lines of code
  PetscPreLoadStage("second stage");
  // lines of code
  PetscPreLoadEnd();
.ve

  Level: intermediate

  Note:
  Only works in C/C++, not Fortran

  Flags available within the macro\:
+ PetscPreLoadingUsed - `PETSC_TRUE` if we are or have done preloading
. PetscPreLoadingOn   - `PETSC_TRUE` if it is CURRENTLY doing preload
. PetscPreLoadIt      - `0` for the first computation (with preloading turned off it is only
                        `0`), `1` for the second
- PetscPreLoadMax     - number of times it will do the computation, only one when preloading is
                        turned off

  The first two variables are available throughout the program, the second two only between the
  `PetscPreLoadBegin()` and `PetscPreLoadEnd()`

.seealso: [](ch_profiling), `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadEnd()`, `PetscPreLoadStage()`
M*/

/*MC
  PetscPreLoadEnd - End a segment of code that may be preloaded (run twice) to get accurate
  timings

  Synopsis:
  #include <petsclog.h>
  void PetscPreLoadEnd(void);

  Not Collective

  Example Usage:
.vb
  PetscPreLoadBegin(PETSC_TRUE, "first stage");
  // lines of code
  PetscPreLoadStage("second stage");
  // lines of code
  PetscPreLoadEnd();
.ve

  Level: intermediate

  Note:
  Only works in C/C++, not Fortran

.seealso: [](ch_profiling), `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadBegin()`,
`PetscPreLoadStage()`
M*/

/*MC
  PetscPreLoadStage - Start a new segment of code to be timed separately to get accurate timings

  Synopsis:
  #include <petsclog.h>
  void PetscPreLoadStage(char *name);

  Not Collective

  Example Usage:
.vb
  PetscPreLoadBegin(PETSC_TRUE, "first stage");
  // lines of code
  PetscPreLoadStage("second stage");
  // lines of code
  PetscPreLoadEnd();
.ve

  Level: intermediate

  Note:
  Only works in C/C++, not Fortran

.seealso: [](ch_profiling), `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadBegin()`, `PetscPreLoadEnd()`
M*/

#if PetscDefined(HAVE_DEVICE)
  #include <petsc/private/deviceimpl.h>

/* Gate tested by PetscLogGpuTimeBegin()/PetscLogGpuTimeEnd(); set by PetscLogGpuTime() */
PetscBool PetscLogGpuTimeFlag = PETSC_FALSE;

/*
   PetscLogGpuTime_Off - Clears PetscLogGpuTimeFlag. PetscLogGpuTime() registers this routine
   with PetscRegisterFinalize().

   This cannot be called by users between PetscInitialize() and PetscFinalize() at any random location in the code
   because it will result in timing results that cannot be interpreted.
*/
static PetscErrorCode PetscLogGpuTime_Off(void)
{
  PetscLogGpuTimeFlag = PETSC_FALSE;
  return PETSC_SUCCESS;
}

/*@C
  PetscLogGpuTime - turn on the logging of GPU time for GPU kernels

  Options Database Key:
. -log_view_gpu_time - provide the GPU times in the `-log_view` output

  Level: advanced

  Notes:
  Turning on the timing of the GPU kernels can slow down the entire computation and should only
  be used when studying the performance of operations on GPU such as vector operations and
  matrix-vector operations.

  This routine should only be called once near the beginning of the program. Once it is started
  it cannot be turned off.
2549156b51fbSBarry Smith 2550d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogView()`, `PetscLogGpuFlops()`, `PetscLogGpuTimeEnd()`, `PetscLogGpuTimeBegin()` 2551156b51fbSBarry Smith @*/ 2552d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogGpuTime(void) 2553d71ae5a4SJacob Faibussowitsch { 2554156b51fbSBarry Smith if (!PetscLogGpuTimeFlag) PetscCall(PetscRegisterFinalize(PetscLogGpuTime_Off)); 2555156b51fbSBarry Smith PetscLogGpuTimeFlag = PETSC_TRUE; 25563ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 2557156b51fbSBarry Smith } 2558156b51fbSBarry Smith 25599ffd0706SHong Zhang /*@C 25609ffd0706SHong Zhang PetscLogGpuTimeBegin - Start timer for device 25619ffd0706SHong Zhang 2562d1f92df0SBarry Smith Level: intermediate 2563d1f92df0SBarry Smith 25649ffd0706SHong Zhang Notes: 256510450e9eSJacob Faibussowitsch When CUDA or HIP is enabled, the timer is run on the GPU, it is a separate logging of time 256610450e9eSJacob Faibussowitsch devoted to GPU computations (excluding kernel launch times). 2567811af0c4SBarry Smith 256810450e9eSJacob Faibussowitsch When CUDA or HIP is not available, the timer is run on the CPU, it is a separate logging of 256910450e9eSJacob Faibussowitsch time devoted to GPU computations (including kernel launch times). 2570811af0c4SBarry Smith 257110450e9eSJacob Faibussowitsch There is no need to call WaitForCUDA() or WaitForHIP() between `PetscLogGpuTimeBegin()` and 257210450e9eSJacob Faibussowitsch `PetscLogGpuTimeEnd()` 2573811af0c4SBarry Smith 257410450e9eSJacob Faibussowitsch This timer should NOT include times for data transfers between the GPU and CPU, nor setup 257510450e9eSJacob Faibussowitsch actions such as allocating space. 2576811af0c4SBarry Smith 257710450e9eSJacob Faibussowitsch The regular logging captures the time for data transfers and any CPU activities during the 257810450e9eSJacob Faibussowitsch event. 
It is used to compute the flop rate on the GPU as it is actively engaged in running a 257910450e9eSJacob Faibussowitsch kernel. 25809ffd0706SHong Zhang 25819ffd0706SHong Zhang Developer Notes: 258210450e9eSJacob Faibussowitsch The GPU event timer captures the execution time of all the kernels launched in the default 258310450e9eSJacob Faibussowitsch stream by the CPU between `PetscLogGpuTimeBegin()` and `PetsLogGpuTimeEnd()`. 2584811af0c4SBarry Smith 258510450e9eSJacob Faibussowitsch `PetscLogGpuTimeBegin()` and `PetsLogGpuTimeEnd()` insert the begin and end events into the 258610450e9eSJacob Faibussowitsch default stream (stream 0). The device will record a time stamp for the event when it reaches 258710450e9eSJacob Faibussowitsch that event in the stream. The function xxxEventSynchronize() is called in 258810450e9eSJacob Faibussowitsch `PetsLogGpuTimeEnd()` to block CPU execution, but not continued GPU execution, until the 258910450e9eSJacob Faibussowitsch timer event is recorded. 25909ffd0706SHong Zhang 2591d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogView()`, `PetscLogGpuFlops()`, `PetscLogGpuTimeEnd()`, `PetscLogGpuTime()` 25929ffd0706SHong Zhang @*/ 2593d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogGpuTimeBegin(void) 2594d71ae5a4SJacob Faibussowitsch { 25959ffd0706SHong Zhang PetscFunctionBegin; 25963ba16761SJacob Faibussowitsch if (!PetscLogPLB || !PetscLogGpuTimeFlag) PetscFunctionReturn(PETSC_SUCCESS); 2597744d70b0SJunchao Zhang if (PetscDefined(HAVE_DEVICE)) { 2598a4af0ceeSJacob Faibussowitsch PetscDeviceContext dctx; 2599a4af0ceeSJacob Faibussowitsch 26009566063dSJacob Faibussowitsch PetscCall(PetscDeviceContextGetCurrentContext(&dctx)); 26019566063dSJacob Faibussowitsch PetscCall(PetscDeviceContextBeginTimer_Internal(dctx)); 2602a4af0ceeSJacob Faibussowitsch } else { 26039566063dSJacob Faibussowitsch PetscCall(PetscTimeSubtract(&petsc_gtime)); 2604a4af0ceeSJacob Faibussowitsch } 26053ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 26069ffd0706SHong Zhang } 26079ffd0706SHong Zhang 26089ffd0706SHong Zhang /*@C 26099ffd0706SHong Zhang PetscLogGpuTimeEnd - Stop timer for device 26109ffd0706SHong Zhang 26119ffd0706SHong Zhang Level: intermediate 26129ffd0706SHong Zhang 2613d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogView()`, `PetscLogGpuFlops()`, `PetscLogGpuTimeBegin()` 26149ffd0706SHong Zhang @*/ 2615d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogGpuTimeEnd(void) 2616d71ae5a4SJacob Faibussowitsch { 26179ffd0706SHong Zhang PetscFunctionBegin; 26183ba16761SJacob Faibussowitsch if (!PetscLogPLE || !PetscLogGpuTimeFlag) PetscFunctionReturn(PETSC_SUCCESS); 2619744d70b0SJunchao Zhang if (PetscDefined(HAVE_DEVICE)) { 2620a4af0ceeSJacob Faibussowitsch PetscDeviceContext dctx; 2621a4af0ceeSJacob Faibussowitsch PetscLogDouble elapsed; 2622a4af0ceeSJacob Faibussowitsch 26239566063dSJacob Faibussowitsch PetscCall(PetscDeviceContextGetCurrentContext(&dctx)); 26249566063dSJacob Faibussowitsch PetscCall(PetscDeviceContextEndTimer_Internal(dctx, &elapsed)); 2625a4af0ceeSJacob Faibussowitsch petsc_gtime += (elapsed / 1000.0); 2626a4af0ceeSJacob Faibussowitsch } else { 26279566063dSJacob Faibussowitsch PetscCall(PetscTimeAdd(&petsc_gtime)); 2628a4af0ceeSJacob Faibussowitsch } 26293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 26309ffd0706SHong Zhang } 2631c708d6e3SStefano Zampini 26329ffd0706SHong Zhang #endif /* end of PETSC_HAVE_DEVICE */ 26339ffd0706SHong Zhang 26345c6c1daeSBarry Smith #else /* end of -DPETSC_USE_LOG section */ 26355c6c1daeSBarry Smith 2636d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogObjectState(PetscObject obj, const char format[], ...) 
2637d71ae5a4SJacob Faibussowitsch { 26385c6c1daeSBarry Smith PetscFunctionBegin; 26393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 26405c6c1daeSBarry Smith } 26415c6c1daeSBarry Smith 26425c6c1daeSBarry Smith #endif /* PETSC_USE_LOG*/ 26435c6c1daeSBarry Smith 26445c6c1daeSBarry Smith PetscClassId PETSC_LARGEST_CLASSID = PETSC_SMALLEST_CLASSID; 26455c6c1daeSBarry Smith PetscClassId PETSC_OBJECT_CLASSID = 0; 26465c6c1daeSBarry Smith 26475c6c1daeSBarry Smith /*@C 26485c6c1daeSBarry Smith PetscClassIdRegister - Registers a new class name for objects and logging operations in an application code. 26495c6c1daeSBarry Smith 26505c6c1daeSBarry Smith Not Collective 26515c6c1daeSBarry Smith 26525c6c1daeSBarry Smith Input Parameter: 26535c6c1daeSBarry Smith . name - The class name 26545c6c1daeSBarry Smith 26555c6c1daeSBarry Smith Output Parameter: 26565c6c1daeSBarry Smith . oclass - The class id or classid 26575c6c1daeSBarry Smith 26585c6c1daeSBarry Smith Level: developer 26595c6c1daeSBarry Smith 2660d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventRegister()` 26615c6c1daeSBarry Smith @*/ 2662d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscClassIdRegister(const char name[], PetscClassId *oclass) 2663d71ae5a4SJacob Faibussowitsch { 26645c6c1daeSBarry Smith #if defined(PETSC_USE_LOG) 26655c6c1daeSBarry Smith PetscStageLog stageLog; 26665c6c1daeSBarry Smith PetscInt stage; 26675c6c1daeSBarry Smith #endif 26685c6c1daeSBarry Smith 26695c6c1daeSBarry Smith PetscFunctionBegin; 26705c6c1daeSBarry Smith *oclass = ++PETSC_LARGEST_CLASSID; 26715c6c1daeSBarry Smith #if defined(PETSC_USE_LOG) 26729566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 26739566063dSJacob Faibussowitsch PetscCall(PetscClassRegLogRegister(stageLog->classLog, name, *oclass)); 267448a46eb9SPierre Jolivet for (stage = 0; stage < stageLog->numStages; stage++) PetscCall(PetscClassPerfLogEnsureSize(stageLog->stageInfo[stage].classLog, 
stageLog->classLog->numClasses)); 26755c6c1daeSBarry Smith #endif 26763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 26775c6c1daeSBarry Smith } 2678210b5426SBarry Smith 2679210b5426SBarry Smith #if defined(PETSC_USE_LOG) && defined(PETSC_HAVE_MPE) 2680210b5426SBarry Smith #include <mpe.h> 2681210b5426SBarry Smith 2682210b5426SBarry Smith PetscBool PetscBeganMPE = PETSC_FALSE; 2683210b5426SBarry Smith 2684495fc317SBarry Smith PETSC_INTERN PetscErrorCode PetscLogEventBeginMPE(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject); 2685495fc317SBarry Smith PETSC_INTERN PetscErrorCode PetscLogEventEndMPE(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject); 2686495fc317SBarry Smith 2687210b5426SBarry Smith /*@C 268810450e9eSJacob Faibussowitsch PetscLogMPEBegin - Turns on MPE logging of events. This creates large log files and slows the 268910450e9eSJacob Faibussowitsch program down. 2690210b5426SBarry Smith 2691811af0c4SBarry Smith Collective over `PETSC_COMM_WORLD` 2692210b5426SBarry Smith 2693811af0c4SBarry Smith Options Database Key: 2694a2553e36SBarry Smith . -log_mpe - Prints extensive log information 2695210b5426SBarry Smith 2696d1f92df0SBarry Smith Level: advanced 2697d1f92df0SBarry Smith 2698811af0c4SBarry Smith Note: 269910450e9eSJacob Faibussowitsch A related routine is `PetscLogDefaultBegin()` (with the options key `-log_view`), which is 270010450e9eSJacob Faibussowitsch intended for production runs since it logs only flop rates and object creation (and should 270110450e9eSJacob Faibussowitsch not significantly slow the programs). 
2702210b5426SBarry Smith 2703d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDump()`, `PetscLogDefaultBegin()`, `PetscLogAllBegin()`, `PetscLogEventActivate()`, 2704db781477SPatrick Sanan `PetscLogEventDeactivate()` 2705210b5426SBarry Smith @*/ 2706d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogMPEBegin(void) 2707d71ae5a4SJacob Faibussowitsch { 2708210b5426SBarry Smith PetscFunctionBegin; 2709210b5426SBarry Smith /* Do MPE initialization */ 2710210b5426SBarry Smith if (!MPE_Initialized_logging()) { /* This function exists in mpich 1.1.2 and higher */ 27119566063dSJacob Faibussowitsch PetscCall(PetscInfo(0, "Initializing MPE.\n")); 27129566063dSJacob Faibussowitsch PetscCall(MPE_Init_log()); 2713210b5426SBarry Smith 2714210b5426SBarry Smith PetscBeganMPE = PETSC_TRUE; 2715210b5426SBarry Smith } else { 27169566063dSJacob Faibussowitsch PetscCall(PetscInfo(0, "MPE already initialized. Not attempting to reinitialize.\n")); 2717210b5426SBarry Smith } 27189566063dSJacob Faibussowitsch PetscCall(PetscLogSet(PetscLogEventBeginMPE, PetscLogEventEndMPE)); 27193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2720210b5426SBarry Smith } 2721210b5426SBarry Smith 2722210b5426SBarry Smith /*@C 2723495fc317SBarry Smith PetscLogMPEDump - Dumps the MPE logging info to file for later use with Jumpshot. 2724210b5426SBarry Smith 272510450e9eSJacob Faibussowitsch Input Parameter: 272610450e9eSJacob Faibussowitsch . 
sname - The filename to dump to 272710450e9eSJacob Faibussowitsch 2728811af0c4SBarry Smith Collective over `PETSC_COMM_WORLD` 2729210b5426SBarry Smith 2730210b5426SBarry Smith Level: advanced 2731210b5426SBarry Smith 2732d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogDump()`, `PetscLogAllBegin()`, `PetscLogMPEBegin()` 2733210b5426SBarry Smith @*/ 2734d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogMPEDump(const char sname[]) 2735d71ae5a4SJacob Faibussowitsch { 2736210b5426SBarry Smith char name[PETSC_MAX_PATH_LEN]; 2737210b5426SBarry Smith 2738210b5426SBarry Smith PetscFunctionBegin; 2739210b5426SBarry Smith if (PetscBeganMPE) { 27409566063dSJacob Faibussowitsch PetscCall(PetscInfo(0, "Finalizing MPE.\n")); 2741210b5426SBarry Smith if (sname) { 2742c6a7a370SJeremy L Thompson PetscCall(PetscStrncpy(name, sname, sizeof(name))); 2743210b5426SBarry Smith } else { 27449566063dSJacob Faibussowitsch PetscCall(PetscGetProgramName(name, sizeof(name))); 2745210b5426SBarry Smith } 27469566063dSJacob Faibussowitsch PetscCall(MPE_Finish_log(name)); 2747210b5426SBarry Smith } else { 27489566063dSJacob Faibussowitsch PetscCall(PetscInfo(0, "Not finalizing MPE (not started by PETSc).\n")); 2749210b5426SBarry Smith } 27503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2751210b5426SBarry Smith } 2752210b5426SBarry Smith 2753210b5426SBarry Smith #define PETSC_RGB_COLORS_MAX 39 27549371c9d4SSatish Balay static const char *PetscLogMPERGBColors[PETSC_RGB_COLORS_MAX] = {"OliveDrab: ", "BlueViolet: ", "CadetBlue: ", "CornflowerBlue: ", "DarkGoldenrod: ", "DarkGreen: ", "DarkKhaki: ", "DarkOliveGreen: ", 27559371c9d4SSatish Balay "DarkOrange: ", "DarkOrchid: ", "DarkSeaGreen: ", "DarkSlateGray: ", "DarkTurquoise: ", "DeepPink: ", "DarkKhaki: ", "DimGray: ", 27569371c9d4SSatish Balay "DodgerBlue: ", "GreenYellow: ", "HotPink: ", "IndianRed: ", "LavenderBlush: ", "LawnGreen: ", "LemonChiffon: ", "LightCoral: ", 27579371c9d4SSatish Balay "LightCyan: ", 
"LightPink: ", "LightSalmon: ", "LightSlateGray: ", "LightYellow: ", "LimeGreen: ", "MediumPurple: ", "MediumSeaGreen: ", 27589371c9d4SSatish Balay "MediumSlateBlue:", "MidnightBlue: ", "MintCream: ", "MistyRose: ", "NavajoWhite: ", "NavyBlue: ", "OliveDrab: "}; 2759210b5426SBarry Smith 2760210b5426SBarry Smith /*@C 2761811af0c4SBarry Smith PetscLogMPEGetRGBColor - This routine returns a rgb color useable with `PetscLogEventRegister()` 2762210b5426SBarry Smith 2763210b5426SBarry Smith Not collective. Maybe it should be? 2764210b5426SBarry Smith 27657a7aea1fSJed Brown Output Parameter: 2766210b5426SBarry Smith . str - character string representing the color 2767210b5426SBarry Smith 2768210b5426SBarry Smith Level: developer 2769210b5426SBarry Smith 2770d1f92df0SBarry Smith .seealso: [](ch_profiling), `PetscLogEventRegister()` 2771210b5426SBarry Smith @*/ 2772d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscLogMPEGetRGBColor(const char *str[]) 2773d71ae5a4SJacob Faibussowitsch { 2774210b5426SBarry Smith static int idx = 0; 2775210b5426SBarry Smith 2776210b5426SBarry Smith PetscFunctionBegin; 2777210b5426SBarry Smith *str = PetscLogMPERGBColors[idx]; 2778210b5426SBarry Smith idx = (idx + 1) % PETSC_RGB_COLORS_MAX; 27793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2780210b5426SBarry Smith } 2781210b5426SBarry Smith 2782210b5426SBarry Smith #endif /* PETSC_USE_LOG && PETSC_HAVE_MPE */ 2783