15c6c1daeSBarry Smith 25c6c1daeSBarry Smith /* 35c6c1daeSBarry Smith PETSc code to log object creation and destruction and PETSc events. 45c6c1daeSBarry Smith 55c6c1daeSBarry Smith This provides the public API used by the rest of PETSc and by users. 65c6c1daeSBarry Smith 75c6c1daeSBarry Smith These routines use a private API that is not used elsewhere in PETSc and is not 85c6c1daeSBarry Smith accessible to users. The private API is defined in logimpl.h and the utils directory. 95c6c1daeSBarry Smith 105c6c1daeSBarry Smith */ 11af0996ceSBarry Smith #include <petsc/private/logimpl.h> /*I "petscsys.h" I*/ 125c6c1daeSBarry Smith #include <petsctime.h> 13665c2dedSJed Brown #include <petscviewer.h> 145c6c1daeSBarry Smith 154851f57dSBarry Smith /* this is not consistently used and is difficult to keep correct if done manually, possibly it should be removed */ 163bb1ff40SBarry Smith PetscErrorCode PetscLogObjectParent(PetscObject p,PetscObject c) 173bb1ff40SBarry Smith { 1827b6d19dSBarry Smith if (!c || !p) return 0; 193bb1ff40SBarry Smith c->parent = p; 203bb1ff40SBarry Smith c->parentid = p->id; 213bb1ff40SBarry Smith return 0; 223bb1ff40SBarry Smith } 233bb1ff40SBarry Smith 24bb72fc59SBarry Smith /*@C 25bb72fc59SBarry Smith PetscLogObjectMemory - Adds to an object a count of additional amount of memory that is used by the object. 26bb72fc59SBarry Smith 27bb72fc59SBarry Smith Not collective. 28bb72fc59SBarry Smith 29bb72fc59SBarry Smith Input Parameters: 30bb72fc59SBarry Smith + obj - the PETSc object 31bb72fc59SBarry Smith - mem - the amount of memory that is being added to the object 32bb72fc59SBarry Smith 33bb72fc59SBarry Smith Level: developer 34bb72fc59SBarry Smith 3595452b02SPatrick Sanan Developer Notes: 364851f57dSBarry Smith This is not used consistently. It is very difficult to manually track the memory usage per object so this should 374851f57dSBarry Smith likely be removed and replaced with an automated system. 
38bb72fc59SBarry Smith 39db781477SPatrick Sanan .seealso: `PetscFinalize()`, `PetscInitializeFortran()`, `PetscGetArgs()`, `PetscInitializeNoArguments()` 40bb72fc59SBarry Smith 41bb72fc59SBarry Smith @*/ 423bb1ff40SBarry Smith PetscErrorCode PetscLogObjectMemory(PetscObject p,PetscLogDouble m) 433bb1ff40SBarry Smith { 44d12f57a0SLisandro Dalcin if (!p) return 0; 4527b6d19dSBarry Smith p->mem += m; 463bb1ff40SBarry Smith return 0; 473bb1ff40SBarry Smith } 483bb1ff40SBarry Smith 495c6c1daeSBarry Smith PetscLogEvent PETSC_LARGEST_EVENT = PETSC_EVENT; 505c6c1daeSBarry Smith 515c6c1daeSBarry Smith #if defined(PETSC_USE_LOG) 525c6c1daeSBarry Smith #include <petscmachineinfo.h> 535c6c1daeSBarry Smith #include <petscconfiginfo.h> 545c6c1daeSBarry Smith 555c6c1daeSBarry Smith /* used in the MPI_XXX() count macros in petsclog.h */ 565c6c1daeSBarry Smith 575c6c1daeSBarry Smith /* Action and object logging variables */ 580298fd71SBarry Smith Action *petsc_actions = NULL; 590298fd71SBarry Smith Object *petsc_objects = NULL; 605c6c1daeSBarry Smith PetscBool petsc_logActions = PETSC_FALSE; 615c6c1daeSBarry Smith PetscBool petsc_logObjects = PETSC_FALSE; 625c6c1daeSBarry Smith int petsc_numActions = 0, petsc_maxActions = 100; 635c6c1daeSBarry Smith int petsc_numObjects = 0, petsc_maxObjects = 100; 645c6c1daeSBarry Smith int petsc_numObjectsDestroyed = 0; 655c6c1daeSBarry Smith 665c6c1daeSBarry Smith /* Global counters */ 675c6c1daeSBarry Smith PetscLogDouble petsc_BaseTime = 0.0; 685c6c1daeSBarry Smith PetscLogDouble petsc_TotalFlops = 0.0; /* The number of flops */ 695c6c1daeSBarry Smith PetscLogDouble petsc_tmp_flops = 0.0; /* The incremental number of flops */ 705c6c1daeSBarry Smith PetscLogDouble petsc_send_ct = 0.0; /* The number of sends */ 715c6c1daeSBarry Smith PetscLogDouble petsc_recv_ct = 0.0; /* The number of receives */ 725c6c1daeSBarry Smith PetscLogDouble petsc_send_len = 0.0; /* The total length of all sent messages */ 735c6c1daeSBarry Smith PetscLogDouble 
petsc_recv_len = 0.0; /* The total length of all received messages */ 745c6c1daeSBarry Smith PetscLogDouble petsc_isend_ct = 0.0; /* The number of immediate sends */ 755c6c1daeSBarry Smith PetscLogDouble petsc_irecv_ct = 0.0; /* The number of immediate receives */ 765c6c1daeSBarry Smith PetscLogDouble petsc_isend_len = 0.0; /* The total length of all immediate send messages */ 775c6c1daeSBarry Smith PetscLogDouble petsc_irecv_len = 0.0; /* The total length of all immediate receive messages */ 785c6c1daeSBarry Smith PetscLogDouble petsc_wait_ct = 0.0; /* The number of waits */ 795c6c1daeSBarry Smith PetscLogDouble petsc_wait_any_ct = 0.0; /* The number of anywaits */ 805c6c1daeSBarry Smith PetscLogDouble petsc_wait_all_ct = 0.0; /* The number of waitalls */ 815c6c1daeSBarry Smith PetscLogDouble petsc_sum_of_waits_ct = 0.0; /* The total number of waits */ 825c6c1daeSBarry Smith PetscLogDouble petsc_allreduce_ct = 0.0; /* The number of reductions */ 835c6c1daeSBarry Smith PetscLogDouble petsc_gather_ct = 0.0; /* The number of gathers and gathervs */ 845c6c1daeSBarry Smith PetscLogDouble petsc_scatter_ct = 0.0; /* The number of scatters and scattervs */ 8520c24465SJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 86bec0b493Shannah_mairs PetscLogDouble petsc_ctog_ct = 0.0; /* The total number of CPU to GPU copies */ 87bec0b493Shannah_mairs PetscLogDouble petsc_gtoc_ct = 0.0; /* The total number of GPU to CPU copies */ 88bec0b493Shannah_mairs PetscLogDouble petsc_ctog_sz = 0.0; /* The total size of CPU to GPU copies */ 89bec0b493Shannah_mairs PetscLogDouble petsc_gtoc_sz = 0.0; /* The total size of GPU to CPU copies */ 9045c4b7c1SBarry Smith PetscLogDouble petsc_ctog_ct_scalar = 0.0; /* The total number of CPU to GPU copies */ 9145c4b7c1SBarry Smith PetscLogDouble petsc_gtoc_ct_scalar = 0.0; /* The total number of GPU to CPU copies */ 9245c4b7c1SBarry Smith PetscLogDouble petsc_ctog_sz_scalar = 0.0; /* The total size of CPU to GPU copies */ 9345c4b7c1SBarry Smith 
PetscLogDouble petsc_gtoc_sz_scalar = 0.0; /* The total size of GPU to CPU copies */ 94958c4211Shannah_mairs PetscLogDouble petsc_gflops = 0.0; /* The flops done on a GPU */ 95958c4211Shannah_mairs PetscLogDouble petsc_gtime = 0.0; /* The time spent on a GPU */ 96bec0b493Shannah_mairs #endif 975c6c1daeSBarry Smith 985c6c1daeSBarry Smith /* Logging functions */ 990298fd71SBarry Smith PetscErrorCode (*PetscLogPHC)(PetscObject) = NULL; 1000298fd71SBarry Smith PetscErrorCode (*PetscLogPHD)(PetscObject) = NULL; 1010298fd71SBarry Smith PetscErrorCode (*PetscLogPLB)(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject) = NULL; 1020298fd71SBarry Smith PetscErrorCode (*PetscLogPLE)(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject) = NULL; 1035c6c1daeSBarry Smith 1045c6c1daeSBarry Smith /* Tracing event logging variables */ 1050298fd71SBarry Smith FILE *petsc_tracefile = NULL; 1065c6c1daeSBarry Smith int petsc_tracelevel = 0; 1075c6c1daeSBarry Smith const char *petsc_traceblanks = " "; 1085c6c1daeSBarry Smith char petsc_tracespace[128] = " "; 1095c6c1daeSBarry Smith PetscLogDouble petsc_tracetime = 0.0; 110896238b9SBarry Smith static PetscBool PetscLogInitializeCalled = PETSC_FALSE; 1115c6c1daeSBarry Smith 112*7a101e5eSJacob Faibussowitsch static PetscIntStack current_log_event_stack = NULL; 113*7a101e5eSJacob Faibussowitsch 11495c0884eSLisandro Dalcin PETSC_INTERN PetscErrorCode PetscLogInitialize(void) 115fa2bb9feSLisandro Dalcin { 116fa2bb9feSLisandro Dalcin int stage; 117fa2bb9feSLisandro Dalcin PetscBool opt; 1185c6c1daeSBarry Smith 119fa2bb9feSLisandro Dalcin PetscFunctionBegin; 120fa2bb9feSLisandro Dalcin if (PetscLogInitializeCalled) PetscFunctionReturn(0); 121fa2bb9feSLisandro Dalcin PetscLogInitializeCalled = PETSC_TRUE; 1225c6c1daeSBarry Smith 123*7a101e5eSJacob Faibussowitsch PetscCall(PetscIntStackCreate(¤t_log_event_stack)); 1249566063dSJacob Faibussowitsch PetscCall(PetscOptionsHasName(NULL,NULL, "-log_exclude_actions", 
&opt)); 125fa2bb9feSLisandro Dalcin if (opt) petsc_logActions = PETSC_FALSE; 1269566063dSJacob Faibussowitsch PetscCall(PetscOptionsHasName(NULL,NULL, "-log_exclude_objects", &opt)); 127fa2bb9feSLisandro Dalcin if (opt) petsc_logObjects = PETSC_FALSE; 128fa2bb9feSLisandro Dalcin if (petsc_logActions) { 1299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(petsc_maxActions, &petsc_actions)); 130fa2bb9feSLisandro Dalcin } 131fa2bb9feSLisandro Dalcin if (petsc_logObjects) { 1329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(petsc_maxObjects, &petsc_objects)); 133fa2bb9feSLisandro Dalcin } 134fa2bb9feSLisandro Dalcin PetscLogPHC = PetscLogObjCreateDefault; 135fa2bb9feSLisandro Dalcin PetscLogPHD = PetscLogObjDestroyDefault; 136fa2bb9feSLisandro Dalcin /* Setup default logging structures */ 1379566063dSJacob Faibussowitsch PetscCall(PetscStageLogCreate(&petsc_stageLog)); 1389566063dSJacob Faibussowitsch PetscCall(PetscStageLogRegister(petsc_stageLog, "Main Stage", &stage)); 1395c6c1daeSBarry Smith 140fa2bb9feSLisandro Dalcin /* All processors sync here for more consistent logging */ 1419566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(PETSC_COMM_WORLD)); 142fa2bb9feSLisandro Dalcin PetscTime(&petsc_BaseTime); 1439566063dSJacob Faibussowitsch PetscCall(PetscLogStagePush(stage)); 144fa2bb9feSLisandro Dalcin PetscFunctionReturn(0); 145fa2bb9feSLisandro Dalcin } 1465c6c1daeSBarry Smith 14795c0884eSLisandro Dalcin PETSC_INTERN PetscErrorCode PetscLogFinalize(void) 1485c6c1daeSBarry Smith { 1495c6c1daeSBarry Smith PetscStageLog stageLog; 1505c6c1daeSBarry Smith 1515c6c1daeSBarry Smith PetscFunctionBegin; 1529566063dSJacob Faibussowitsch PetscCall(PetscFree(petsc_actions)); 1539566063dSJacob Faibussowitsch PetscCall(PetscFree(petsc_objects)); 1549566063dSJacob Faibussowitsch PetscCall(PetscLogNestedEnd()); 1559566063dSJacob Faibussowitsch PetscCall(PetscLogSet(NULL, NULL)); 1565c6c1daeSBarry Smith 1575c6c1daeSBarry Smith /* Resetting phase */ 1589566063dSJacob 
Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 1599566063dSJacob Faibussowitsch PetscCall(PetscStageLogDestroy(stageLog)); 160*7a101e5eSJacob Faibussowitsch PetscCall(PetscIntStackDestroy(current_log_event_stack)); 161*7a101e5eSJacob Faibussowitsch current_log_event_stack = NULL; 162a297a907SKarl Rupp 1635c6c1daeSBarry Smith petsc_TotalFlops = 0.0; 1645c6c1daeSBarry Smith petsc_numActions = 0; 1655c6c1daeSBarry Smith petsc_numObjects = 0; 1665c6c1daeSBarry Smith petsc_numObjectsDestroyed = 0; 1675c6c1daeSBarry Smith petsc_maxActions = 100; 1685c6c1daeSBarry Smith petsc_maxObjects = 100; 1690298fd71SBarry Smith petsc_actions = NULL; 1700298fd71SBarry Smith petsc_objects = NULL; 1715c6c1daeSBarry Smith petsc_logActions = PETSC_FALSE; 1725c6c1daeSBarry Smith petsc_logObjects = PETSC_FALSE; 1735c6c1daeSBarry Smith petsc_BaseTime = 0.0; 1745c6c1daeSBarry Smith petsc_TotalFlops = 0.0; 1755c6c1daeSBarry Smith petsc_tmp_flops = 0.0; 1765c6c1daeSBarry Smith petsc_send_ct = 0.0; 1775c6c1daeSBarry Smith petsc_recv_ct = 0.0; 1785c6c1daeSBarry Smith petsc_send_len = 0.0; 1795c6c1daeSBarry Smith petsc_recv_len = 0.0; 1805c6c1daeSBarry Smith petsc_isend_ct = 0.0; 1815c6c1daeSBarry Smith petsc_irecv_ct = 0.0; 1825c6c1daeSBarry Smith petsc_isend_len = 0.0; 1835c6c1daeSBarry Smith petsc_irecv_len = 0.0; 1845c6c1daeSBarry Smith petsc_wait_ct = 0.0; 1855c6c1daeSBarry Smith petsc_wait_any_ct = 0.0; 1865c6c1daeSBarry Smith petsc_wait_all_ct = 0.0; 1875c6c1daeSBarry Smith petsc_sum_of_waits_ct = 0.0; 1885c6c1daeSBarry Smith petsc_allreduce_ct = 0.0; 1895c6c1daeSBarry Smith petsc_gather_ct = 0.0; 1905c6c1daeSBarry Smith petsc_scatter_ct = 0.0; 191d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 192bec0b493Shannah_mairs petsc_ctog_ct = 0.0; 193bec0b493Shannah_mairs petsc_gtoc_ct = 0.0; 194bec0b493Shannah_mairs petsc_ctog_sz = 0.0; 195bec0b493Shannah_mairs petsc_gtoc_sz = 0.0; 196958c4211Shannah_mairs petsc_gflops = 0.0; 197958c4211Shannah_mairs petsc_gtime = 0.0; 
198bec0b493Shannah_mairs #endif 1995c6c1daeSBarry Smith PETSC_LARGEST_EVENT = PETSC_EVENT; 2000298fd71SBarry Smith PetscLogPHC = NULL; 2010298fd71SBarry Smith PetscLogPHD = NULL; 2020298fd71SBarry Smith petsc_tracefile = NULL; 2035c6c1daeSBarry Smith petsc_tracelevel = 0; 2045c6c1daeSBarry Smith petsc_traceblanks = " "; 2055c6c1daeSBarry Smith petsc_tracespace[0] = ' '; petsc_tracespace[1] = 0; 2065c6c1daeSBarry Smith petsc_tracetime = 0.0; 2075c6c1daeSBarry Smith PETSC_LARGEST_CLASSID = PETSC_SMALLEST_CLASSID; 2085c6c1daeSBarry Smith PETSC_OBJECT_CLASSID = 0; 20902c9f0b5SLisandro Dalcin petsc_stageLog = NULL; 210896238b9SBarry Smith PetscLogInitializeCalled = PETSC_FALSE; 2115c6c1daeSBarry Smith PetscFunctionReturn(0); 2125c6c1daeSBarry Smith } 2135c6c1daeSBarry Smith 2145c6c1daeSBarry Smith /*@C 2155c6c1daeSBarry Smith PetscLogSet - Sets the logging functions called at the beginning and ending of every event. 2165c6c1daeSBarry Smith 2175c6c1daeSBarry Smith Not Collective 2185c6c1daeSBarry Smith 2195c6c1daeSBarry Smith Input Parameters: 2205c6c1daeSBarry Smith + b - The function called at beginning of event 2215c6c1daeSBarry Smith - e - The function called at end of event 2225c6c1daeSBarry Smith 2235c6c1daeSBarry Smith Level: developer 2245c6c1daeSBarry Smith 225db781477SPatrick Sanan .seealso: `PetscLogDump()`, `PetscLogDefaultBegin()`, `PetscLogAllBegin()`, `PetscLogTraceBegin()` 2265c6c1daeSBarry Smith @*/ 2275c6c1daeSBarry Smith PetscErrorCode PetscLogSet(PetscErrorCode (*b)(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject), 2285c6c1daeSBarry Smith PetscErrorCode (*e)(PetscLogEvent, int, PetscObject, PetscObject, PetscObject, PetscObject)) 2295c6c1daeSBarry Smith { 2305c6c1daeSBarry Smith PetscFunctionBegin; 2315c6c1daeSBarry Smith PetscLogPLB = b; 2325c6c1daeSBarry Smith PetscLogPLE = e; 2335c6c1daeSBarry Smith PetscFunctionReturn(0); 2345c6c1daeSBarry Smith } 2355c6c1daeSBarry Smith 2365c6c1daeSBarry Smith /*@C 2374dd65854SConnor Ward 
PetscLogIsActive - Check if logging is currently in progress. 2384dd65854SConnor Ward 2394dd65854SConnor Ward Not Collective 2404dd65854SConnor Ward 2414dd65854SConnor Ward Output Parameter: 2424dd65854SConnor Ward . isActive - PETSC_TRUE if logging is in progress, PETSC_FALSE otherwise 2434dd65854SConnor Ward 2444dd65854SConnor Ward Level: beginner 2454dd65854SConnor Ward 246db781477SPatrick Sanan .seealso: `PetscLogDefaultBegin()`, `PetscLogAllBegin()`, `PetscLogSet()` 2474dd65854SConnor Ward @*/ 2484dd65854SConnor Ward PetscErrorCode PetscLogIsActive(PetscBool *isActive) 2494dd65854SConnor Ward { 2504dd65854SConnor Ward PetscFunctionBegin; 2514dd65854SConnor Ward *isActive = (PetscLogPLB && PetscLogPLE) ? PETSC_TRUE : PETSC_FALSE; 2524dd65854SConnor Ward PetscFunctionReturn(0); 2534dd65854SConnor Ward } 2544dd65854SConnor Ward 2554dd65854SConnor Ward /*@C 256bb1d7374SBarry Smith PetscLogDefaultBegin - Turns on logging of objects and events. This logs flop 2575c6c1daeSBarry Smith rates and object creation and should not slow programs down too much. 2585c6c1daeSBarry Smith This routine may be called more than once. 2595c6c1daeSBarry Smith 2605c6c1daeSBarry Smith Logically Collective over PETSC_COMM_WORLD 2615c6c1daeSBarry Smith 2625c6c1daeSBarry Smith Options Database Keys: 263a2553e36SBarry Smith . -log_view [viewertype:filename:viewerformat] - Prints summary of flop and timing information to the 264a2553e36SBarry Smith screen (for code configured with --with-log=1 (which is the default)) 2655c6c1daeSBarry Smith 2665c6c1daeSBarry Smith Usage: 2675c6c1daeSBarry Smith .vb 2685c6c1daeSBarry Smith PetscInitialize(...); 269bb1d7374SBarry Smith PetscLogDefaultBegin(); 2705c6c1daeSBarry Smith ... code ... 
2715c6c1daeSBarry Smith PetscLogView(viewer); or PetscLogDump(); 2725c6c1daeSBarry Smith PetscFinalize(); 2735c6c1daeSBarry Smith .ve 2745c6c1daeSBarry Smith 2755c6c1daeSBarry Smith Notes: 2765c6c1daeSBarry Smith PetscLogView(viewer) or PetscLogDump() actually cause the printing of 2775c6c1daeSBarry Smith the logging information. 2785c6c1daeSBarry Smith 2795c6c1daeSBarry Smith Level: advanced 2805c6c1daeSBarry Smith 281db781477SPatrick Sanan .seealso: `PetscLogDump()`, `PetscLogAllBegin()`, `PetscLogView()`, `PetscLogTraceBegin()` 2825c6c1daeSBarry Smith @*/ 283bb1d7374SBarry Smith PetscErrorCode PetscLogDefaultBegin(void) 2845c6c1daeSBarry Smith { 2855c6c1daeSBarry Smith PetscFunctionBegin; 2869566063dSJacob Faibussowitsch PetscCall(PetscLogSet(PetscLogEventBeginDefault, PetscLogEventEndDefault)); 2875c6c1daeSBarry Smith PetscFunctionReturn(0); 2885c6c1daeSBarry Smith } 2895c6c1daeSBarry Smith 2905c6c1daeSBarry Smith /*@C 2915c6c1daeSBarry Smith PetscLogAllBegin - Turns on extensive logging of objects and events. Logs 2925c6c1daeSBarry Smith all events. This creates large log files and slows the program down. 2935c6c1daeSBarry Smith 2945c6c1daeSBarry Smith Logically Collective on PETSC_COMM_WORLD 2955c6c1daeSBarry Smith 2965c6c1daeSBarry Smith Options Database Keys: 297a2553e36SBarry Smith . -log_all - Prints extensive log information 2985c6c1daeSBarry Smith 2995c6c1daeSBarry Smith Usage: 3005c6c1daeSBarry Smith .vb 3015c6c1daeSBarry Smith PetscInitialize(...); 3025c6c1daeSBarry Smith PetscLogAllBegin(); 3035c6c1daeSBarry Smith ... code ... 
3045c6c1daeSBarry Smith PetscLogDump(filename); 3055c6c1daeSBarry Smith PetscFinalize(); 3065c6c1daeSBarry Smith .ve 3075c6c1daeSBarry Smith 3085c6c1daeSBarry Smith Notes: 309bb1d7374SBarry Smith A related routine is PetscLogDefaultBegin() (with the options key -log), which is 3105c6c1daeSBarry Smith intended for production runs since it logs only flop rates and object 3115c6c1daeSBarry Smith creation (and shouldn't significantly slow the programs). 3125c6c1daeSBarry Smith 3135c6c1daeSBarry Smith Level: advanced 3145c6c1daeSBarry Smith 315db781477SPatrick Sanan .seealso: `PetscLogDump()`, `PetscLogDefaultBegin()`, `PetscLogTraceBegin()` 3165c6c1daeSBarry Smith @*/ 3175c6c1daeSBarry Smith PetscErrorCode PetscLogAllBegin(void) 3185c6c1daeSBarry Smith { 3195c6c1daeSBarry Smith PetscFunctionBegin; 3209566063dSJacob Faibussowitsch PetscCall(PetscLogSet(PetscLogEventBeginComplete, PetscLogEventEndComplete)); 3215c6c1daeSBarry Smith PetscFunctionReturn(0); 3225c6c1daeSBarry Smith } 3235c6c1daeSBarry Smith 324956f8c0dSBarry Smith /*@C 3255c6c1daeSBarry Smith PetscLogTraceBegin - Activates trace logging. Every time a PETSc event 3265c6c1daeSBarry Smith begins or ends, the event name is printed. 3275c6c1daeSBarry Smith 3285c6c1daeSBarry Smith Logically Collective on PETSC_COMM_WORLD 3295c6c1daeSBarry Smith 3305c6c1daeSBarry Smith Input Parameter: 3315c6c1daeSBarry Smith . file - The file to print trace in (e.g. stdout) 3325c6c1daeSBarry Smith 3335c6c1daeSBarry Smith Options Database Key: 3345c6c1daeSBarry Smith . -log_trace [filename] - Activates PetscLogTraceBegin() 3355c6c1daeSBarry Smith 3365c6c1daeSBarry Smith Notes: 3375c6c1daeSBarry Smith PetscLogTraceBegin() prints the processor number, the execution time (sec), 3385c6c1daeSBarry Smith then "Event begin:" or "Event end:" followed by the event name. 
3395c6c1daeSBarry Smith 3405c6c1daeSBarry Smith PetscLogTraceBegin() allows tracing of all PETSc calls, which is useful 3415c6c1daeSBarry Smith to determine where a program is hanging without running in the 3425c6c1daeSBarry Smith debugger. Can be used in conjunction with the -info option. 3435c6c1daeSBarry Smith 3445c6c1daeSBarry Smith Level: intermediate 3455c6c1daeSBarry Smith 346db781477SPatrick Sanan .seealso: `PetscLogDump()`, `PetscLogAllBegin()`, `PetscLogView()`, `PetscLogDefaultBegin()` 3475c6c1daeSBarry Smith @*/ 3485c6c1daeSBarry Smith PetscErrorCode PetscLogTraceBegin(FILE *file) 3495c6c1daeSBarry Smith { 3505c6c1daeSBarry Smith PetscFunctionBegin; 3515c6c1daeSBarry Smith petsc_tracefile = file; 352a297a907SKarl Rupp 3539566063dSJacob Faibussowitsch PetscCall(PetscLogSet(PetscLogEventBeginTrace, PetscLogEventEndTrace)); 3545c6c1daeSBarry Smith PetscFunctionReturn(0); 3555c6c1daeSBarry Smith } 3565c6c1daeSBarry Smith 3575c6c1daeSBarry Smith /*@ 3585c6c1daeSBarry Smith PetscLogActions - Determines whether actions are logged for the graphical viewer. 3595c6c1daeSBarry Smith 3605c6c1daeSBarry Smith Not Collective 3615c6c1daeSBarry Smith 3625c6c1daeSBarry Smith Input Parameter: 3635c6c1daeSBarry Smith . flag - PETSC_TRUE if actions are to be logged 3645c6c1daeSBarry Smith 3655c6c1daeSBarry Smith Level: intermediate 3665c6c1daeSBarry Smith 3675c6c1daeSBarry Smith Note: Logging of actions continues to consume more memory as the program 3685c6c1daeSBarry Smith runs. Long running programs should consider turning this feature off. 3695c6c1daeSBarry Smith 3705c6c1daeSBarry Smith Options Database Keys: 3715c6c1daeSBarry Smith . 
-log_exclude_actions - Turns off actions logging 3725c6c1daeSBarry Smith 373db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStagePop()` 3745c6c1daeSBarry Smith @*/ 3755c6c1daeSBarry Smith PetscErrorCode PetscLogActions(PetscBool flag) 3765c6c1daeSBarry Smith { 3775c6c1daeSBarry Smith PetscFunctionBegin; 3785c6c1daeSBarry Smith petsc_logActions = flag; 3795c6c1daeSBarry Smith PetscFunctionReturn(0); 3805c6c1daeSBarry Smith } 3815c6c1daeSBarry Smith 3825c6c1daeSBarry Smith /*@ 3835c6c1daeSBarry Smith PetscLogObjects - Determines whether objects are logged for the graphical viewer. 3845c6c1daeSBarry Smith 3855c6c1daeSBarry Smith Not Collective 3865c6c1daeSBarry Smith 3875c6c1daeSBarry Smith Input Parameter: 3885c6c1daeSBarry Smith . flag - PETSC_TRUE if objects are to be logged 3895c6c1daeSBarry Smith 3905c6c1daeSBarry Smith Level: intermediate 3915c6c1daeSBarry Smith 3925c6c1daeSBarry Smith Note: Logging of objects continues to consume more memory as the program 3935c6c1daeSBarry Smith runs. Long running programs should consider turning this feature off. 3945c6c1daeSBarry Smith 3955c6c1daeSBarry Smith Options Database Keys: 3965c6c1daeSBarry Smith . -log_exclude_objects - Turns off objects logging 3975c6c1daeSBarry Smith 398db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStagePop()` 3995c6c1daeSBarry Smith @*/ 4005c6c1daeSBarry Smith PetscErrorCode PetscLogObjects(PetscBool flag) 4015c6c1daeSBarry Smith { 4025c6c1daeSBarry Smith PetscFunctionBegin; 4035c6c1daeSBarry Smith petsc_logObjects = flag; 4045c6c1daeSBarry Smith PetscFunctionReturn(0); 4055c6c1daeSBarry Smith } 4065c6c1daeSBarry Smith 4075c6c1daeSBarry Smith /*------------------------------------------------ Stage Functions --------------------------------------------------*/ 4085c6c1daeSBarry Smith /*@C 40974c0405dSRichard Tran Mills PetscLogStageRegister - Attaches a character string name to a logging stage. 
4105c6c1daeSBarry Smith 4115c6c1daeSBarry Smith Not Collective 4125c6c1daeSBarry Smith 4135c6c1daeSBarry Smith Input Parameter: 4145c6c1daeSBarry Smith . sname - The name to associate with that stage 4155c6c1daeSBarry Smith 4165c6c1daeSBarry Smith Output Parameter: 4175c6c1daeSBarry Smith . stage - The stage number 4185c6c1daeSBarry Smith 4195c6c1daeSBarry Smith Level: intermediate 4205c6c1daeSBarry Smith 421db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStagePop()` 4225c6c1daeSBarry Smith @*/ 4235c6c1daeSBarry Smith PetscErrorCode PetscLogStageRegister(const char sname[],PetscLogStage *stage) 4245c6c1daeSBarry Smith { 4255c6c1daeSBarry Smith PetscStageLog stageLog; 4265c6c1daeSBarry Smith PetscLogEvent event; 4275c6c1daeSBarry Smith 4285c6c1daeSBarry Smith PetscFunctionBegin; 4299566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 4309566063dSJacob Faibussowitsch PetscCall(PetscStageLogRegister(stageLog, sname, stage)); 4315c6c1daeSBarry Smith /* Copy events already changed in the main stage, this sucks */ 4329566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogEnsureSize(stageLog->stageInfo[*stage].eventLog, stageLog->eventLog->numEvents)); 4335c6c1daeSBarry Smith for (event = 0; event < stageLog->eventLog->numEvents; event++) { 4349566063dSJacob Faibussowitsch PetscCall(PetscEventPerfInfoCopy(&stageLog->stageInfo[0].eventLog->eventInfo[event],&stageLog->stageInfo[*stage].eventLog->eventInfo[event])); 4355c6c1daeSBarry Smith } 4369566063dSJacob Faibussowitsch PetscCall(PetscClassPerfLogEnsureSize(stageLog->stageInfo[*stage].classLog, stageLog->classLog->numClasses)); 4375c6c1daeSBarry Smith PetscFunctionReturn(0); 4385c6c1daeSBarry Smith } 4395c6c1daeSBarry Smith 4405c6c1daeSBarry Smith /*@C 4415c6c1daeSBarry Smith PetscLogStagePush - This function pushes a stage on the stack. 
4425c6c1daeSBarry Smith 4435c6c1daeSBarry Smith Not Collective 4445c6c1daeSBarry Smith 4455c6c1daeSBarry Smith Input Parameter: 4465c6c1daeSBarry Smith . stage - The stage on which to log 4475c6c1daeSBarry Smith 4485c6c1daeSBarry Smith Usage: 4495c6c1daeSBarry Smith If the option -log_sumary is used to run the program containing the 4505c6c1daeSBarry Smith following code, then 2 sets of summary data will be printed during 4515c6c1daeSBarry Smith PetscFinalize(). 4525c6c1daeSBarry Smith .vb 4535c6c1daeSBarry Smith PetscInitialize(int *argc,char ***args,0,0); 4545c6c1daeSBarry Smith [stage 0 of code] 4555c6c1daeSBarry Smith PetscLogStagePush(1); 4565c6c1daeSBarry Smith [stage 1 of code] 4575c6c1daeSBarry Smith PetscLogStagePop(); 4585c6c1daeSBarry Smith PetscBarrier(...); 4595c6c1daeSBarry Smith [more stage 0 of code] 4605c6c1daeSBarry Smith PetscFinalize(); 4615c6c1daeSBarry Smith .ve 4625c6c1daeSBarry Smith 4635c6c1daeSBarry Smith Notes: 4645c6c1daeSBarry Smith Use PetscLogStageRegister() to register a stage. 4655c6c1daeSBarry Smith 4665c6c1daeSBarry Smith Level: intermediate 4675c6c1daeSBarry Smith 468db781477SPatrick Sanan .seealso: `PetscLogStagePop()`, `PetscLogStageRegister()`, `PetscBarrier()` 4695c6c1daeSBarry Smith @*/ 4705c6c1daeSBarry Smith PetscErrorCode PetscLogStagePush(PetscLogStage stage) 4715c6c1daeSBarry Smith { 4725c6c1daeSBarry Smith PetscStageLog stageLog; 4735c6c1daeSBarry Smith 4745c6c1daeSBarry Smith PetscFunctionBegin; 4759566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 4769566063dSJacob Faibussowitsch PetscCall(PetscStageLogPush(stageLog, stage)); 4775c6c1daeSBarry Smith PetscFunctionReturn(0); 4785c6c1daeSBarry Smith } 4795c6c1daeSBarry Smith 4805c6c1daeSBarry Smith /*@C 4815c6c1daeSBarry Smith PetscLogStagePop - This function pops a stage from the stack. 
4825c6c1daeSBarry Smith 4835c6c1daeSBarry Smith Not Collective 4845c6c1daeSBarry Smith 4855c6c1daeSBarry Smith Usage: 4865c6c1daeSBarry Smith If the option -log_sumary is used to run the program containing the 4875c6c1daeSBarry Smith following code, then 2 sets of summary data will be printed during 4885c6c1daeSBarry Smith PetscFinalize(). 4895c6c1daeSBarry Smith .vb 4905c6c1daeSBarry Smith PetscInitialize(int *argc,char ***args,0,0); 4915c6c1daeSBarry Smith [stage 0 of code] 4925c6c1daeSBarry Smith PetscLogStagePush(1); 4935c6c1daeSBarry Smith [stage 1 of code] 4945c6c1daeSBarry Smith PetscLogStagePop(); 4955c6c1daeSBarry Smith PetscBarrier(...); 4965c6c1daeSBarry Smith [more stage 0 of code] 4975c6c1daeSBarry Smith PetscFinalize(); 4985c6c1daeSBarry Smith .ve 4995c6c1daeSBarry Smith 5005c6c1daeSBarry Smith Notes: 5015c6c1daeSBarry Smith Use PetscLogStageRegister() to register a stage. 5025c6c1daeSBarry Smith 5035c6c1daeSBarry Smith Level: intermediate 5045c6c1daeSBarry Smith 505db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStageRegister()`, `PetscBarrier()` 5065c6c1daeSBarry Smith @*/ 5075c6c1daeSBarry Smith PetscErrorCode PetscLogStagePop(void) 5085c6c1daeSBarry Smith { 5095c6c1daeSBarry Smith PetscStageLog stageLog; 5105c6c1daeSBarry Smith 5115c6c1daeSBarry Smith PetscFunctionBegin; 5129566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 5139566063dSJacob Faibussowitsch PetscCall(PetscStageLogPop(stageLog)); 5145c6c1daeSBarry Smith PetscFunctionReturn(0); 5155c6c1daeSBarry Smith } 5165c6c1daeSBarry Smith 5175c6c1daeSBarry Smith /*@ 5185c6c1daeSBarry Smith PetscLogStageSetActive - Determines stage activity for PetscLogEventBegin() and PetscLogEventEnd(). 
5195c6c1daeSBarry Smith 5205c6c1daeSBarry Smith Not Collective 5215c6c1daeSBarry Smith 5225c6c1daeSBarry Smith Input Parameters: 5235c6c1daeSBarry Smith + stage - The stage 5245c6c1daeSBarry Smith - isActive - The activity flag, PETSC_TRUE for logging, else PETSC_FALSE (defaults to PETSC_TRUE) 5255c6c1daeSBarry Smith 5265c6c1daeSBarry Smith Level: intermediate 5275c6c1daeSBarry Smith 528db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadBegin()`, `PetscPreLoadEnd()`, `PetscPreLoadStage()` 5295c6c1daeSBarry Smith @*/ 5305c6c1daeSBarry Smith PetscErrorCode PetscLogStageSetActive(PetscLogStage stage, PetscBool isActive) 5315c6c1daeSBarry Smith { 5325c6c1daeSBarry Smith PetscStageLog stageLog; 5335c6c1daeSBarry Smith 5345c6c1daeSBarry Smith PetscFunctionBegin; 5359566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 5369566063dSJacob Faibussowitsch PetscCall(PetscStageLogSetActive(stageLog, stage, isActive)); 5375c6c1daeSBarry Smith PetscFunctionReturn(0); 5385c6c1daeSBarry Smith } 5395c6c1daeSBarry Smith 5405c6c1daeSBarry Smith /*@ 5415c6c1daeSBarry Smith PetscLogStageGetActive - Returns stage activity for PetscLogEventBegin() and PetscLogEventEnd(). 5425c6c1daeSBarry Smith 5435c6c1daeSBarry Smith Not Collective 5445c6c1daeSBarry Smith 5455c6c1daeSBarry Smith Input Parameter: 5465c6c1daeSBarry Smith . stage - The stage 5475c6c1daeSBarry Smith 5485c6c1daeSBarry Smith Output Parameter: 5495c6c1daeSBarry Smith . 
isActive - The activity flag, PETSC_TRUE for logging, else PETSC_FALSE (defaults to PETSC_TRUE) 5505c6c1daeSBarry Smith 5515c6c1daeSBarry Smith Level: intermediate 5525c6c1daeSBarry Smith 553db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadBegin()`, `PetscPreLoadEnd()`, `PetscPreLoadStage()` 5545c6c1daeSBarry Smith @*/ 5555c6c1daeSBarry Smith PetscErrorCode PetscLogStageGetActive(PetscLogStage stage, PetscBool *isActive) 5565c6c1daeSBarry Smith { 5575c6c1daeSBarry Smith PetscStageLog stageLog; 5585c6c1daeSBarry Smith 5595c6c1daeSBarry Smith PetscFunctionBegin; 5609566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 5619566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetActive(stageLog, stage, isActive)); 5625c6c1daeSBarry Smith PetscFunctionReturn(0); 5635c6c1daeSBarry Smith } 5645c6c1daeSBarry Smith 5655c6c1daeSBarry Smith /*@ 5665c6c1daeSBarry Smith PetscLogStageSetVisible - Determines stage visibility in PetscLogView() 5675c6c1daeSBarry Smith 5685c6c1daeSBarry Smith Not Collective 5695c6c1daeSBarry Smith 5705c6c1daeSBarry Smith Input Parameters: 5715c6c1daeSBarry Smith + stage - The stage 5725c6c1daeSBarry Smith - isVisible - The visibility flag, PETSC_TRUE to print, else PETSC_FALSE (defaults to PETSC_TRUE) 5735c6c1daeSBarry Smith 5745c6c1daeSBarry Smith Level: intermediate 5755c6c1daeSBarry Smith 576db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscLogView()` 5775c6c1daeSBarry Smith @*/ 5785c6c1daeSBarry Smith PetscErrorCode PetscLogStageSetVisible(PetscLogStage stage, PetscBool isVisible) 5795c6c1daeSBarry Smith { 5805c6c1daeSBarry Smith PetscStageLog stageLog; 5815c6c1daeSBarry Smith 5825c6c1daeSBarry Smith PetscFunctionBegin; 5839566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 5849566063dSJacob Faibussowitsch PetscCall(PetscStageLogSetVisible(stageLog, stage, isVisible)); 5855c6c1daeSBarry 
Smith PetscFunctionReturn(0); 5865c6c1daeSBarry Smith } 5875c6c1daeSBarry Smith 5885c6c1daeSBarry Smith /*@ 5895c6c1daeSBarry Smith PetscLogStageGetVisible - Returns stage visibility in PetscLogView() 5905c6c1daeSBarry Smith 5915c6c1daeSBarry Smith Not Collective 5925c6c1daeSBarry Smith 5935c6c1daeSBarry Smith Input Parameter: 5945c6c1daeSBarry Smith . stage - The stage 5955c6c1daeSBarry Smith 5965c6c1daeSBarry Smith Output Parameter: 5975c6c1daeSBarry Smith . isVisible - The visibility flag, PETSC_TRUE to print, else PETSC_FALSE (defaults to PETSC_TRUE) 5985c6c1daeSBarry Smith 5995c6c1daeSBarry Smith Level: intermediate 6005c6c1daeSBarry Smith 601db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscLogView()` 6025c6c1daeSBarry Smith @*/ 6035c6c1daeSBarry Smith PetscErrorCode PetscLogStageGetVisible(PetscLogStage stage, PetscBool *isVisible) 6045c6c1daeSBarry Smith { 6055c6c1daeSBarry Smith PetscStageLog stageLog; 6065c6c1daeSBarry Smith 6075c6c1daeSBarry Smith PetscFunctionBegin; 6089566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 6099566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetVisible(stageLog, stage, isVisible)); 6105c6c1daeSBarry Smith PetscFunctionReturn(0); 6115c6c1daeSBarry Smith } 6125c6c1daeSBarry Smith 6135c6c1daeSBarry Smith /*@C 6145c6c1daeSBarry Smith PetscLogStageGetId - Returns the stage id when given the stage name. 6155c6c1daeSBarry Smith 6165c6c1daeSBarry Smith Not Collective 6175c6c1daeSBarry Smith 6185c6c1daeSBarry Smith Input Parameter: 6195c6c1daeSBarry Smith . name - The stage name 6205c6c1daeSBarry Smith 6215c6c1daeSBarry Smith Output Parameter: 6225a4a3fabSBarry Smith . 
stage - The stage, or -1 if no stage with that name exists 6235c6c1daeSBarry Smith 6245c6c1daeSBarry Smith Level: intermediate 6255c6c1daeSBarry Smith 626db781477SPatrick Sanan .seealso: `PetscLogStagePush()`, `PetscLogStagePop()`, `PetscPreLoadBegin()`, `PetscPreLoadEnd()`, `PetscPreLoadStage()` 6275c6c1daeSBarry Smith @*/ 6285c6c1daeSBarry Smith PetscErrorCode PetscLogStageGetId(const char name[], PetscLogStage *stage) 6295c6c1daeSBarry Smith { 6305c6c1daeSBarry Smith PetscStageLog stageLog; 6315c6c1daeSBarry Smith 6325c6c1daeSBarry Smith PetscFunctionBegin; 6339566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 6349566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetStage(stageLog, name, stage)); 6355c6c1daeSBarry Smith PetscFunctionReturn(0); 6365c6c1daeSBarry Smith } 6375c6c1daeSBarry Smith 6385c6c1daeSBarry Smith /*------------------------------------------------ Event Functions --------------------------------------------------*/ 639*7a101e5eSJacob Faibussowitsch 6405c6c1daeSBarry Smith /*@C 6415c6c1daeSBarry Smith PetscLogEventRegister - Registers an event name for logging operations in application code. 6425c6c1daeSBarry Smith 6435c6c1daeSBarry Smith Not Collective 6445c6c1daeSBarry Smith 645d8d19677SJose E. Roman Input Parameters: 6465c6c1daeSBarry Smith + name - The name associated with the event 6475c6c1daeSBarry Smith - classid - The classid associated to the class for this event, obtain either with 6485c6c1daeSBarry Smith PetscClassIdRegister() or use a predefined one such as KSP_CLASSID, SNES_CLASSID, the predefined ones 6495c6c1daeSBarry Smith are only available in C code 6505c6c1daeSBarry Smith 6515c6c1daeSBarry Smith Output Parameter: 6525c6c1daeSBarry Smith . event - The event id for use with PetscLogEventBegin() and PetscLogEventEnd().
6535c6c1daeSBarry Smith 6545c6c1daeSBarry Smith Example of Usage: 6555c6c1daeSBarry Smith .vb 6565c6c1daeSBarry Smith PetscLogEvent USER_EVENT; 6575c6c1daeSBarry Smith PetscClassId classid; 6585c6c1daeSBarry Smith PetscLogDouble user_event_flops; 6595c6c1daeSBarry Smith PetscClassIdRegister("class name",&classid); 6605c6c1daeSBarry Smith PetscLogEventRegister("User event name",classid,&USER_EVENT); 6615c6c1daeSBarry Smith PetscLogEventBegin(USER_EVENT,0,0,0,0); 6625c6c1daeSBarry Smith [code segment to monitor] 6635c6c1daeSBarry Smith PetscLogFlops(user_event_flops); 6645c6c1daeSBarry Smith PetscLogEventEnd(USER_EVENT,0,0,0,0); 6655c6c1daeSBarry Smith .ve 6665c6c1daeSBarry Smith 6675c6c1daeSBarry Smith Notes: 6685c6c1daeSBarry Smith PETSc automatically logs library events if the code has been 669a2553e36SBarry Smith configured with --with-log (which is the default) and 670a2553e36SBarry Smith -log_view or -log_all is specified. PetscLogEventRegister() is 6715c6c1daeSBarry Smith intended for logging user events to supplement this PETSc 6725c6c1daeSBarry Smith information. 6735c6c1daeSBarry Smith 674495fc317SBarry Smith PETSc can gather data for use with the utility Jumpshot 6755c6c1daeSBarry Smith (part of the MPICH distribution). If PETSc has been compiled 6765c6c1daeSBarry Smith with flag -DPETSC_HAVE_MPE (MPE is an additional utility within 6775c6c1daeSBarry Smith MPICH), the user can employ another command line option, -log_mpe, 6785c6c1daeSBarry Smith to create a logfile, "mpe.log", which can be visualized with 679495fc317SBarry Smith Jumpshot. 6805c6c1daeSBarry Smith 6815c6c1daeSBarry Smith The classid is associated with each event so that classes of events 6825c6c1daeSBarry Smith can be disabled simultaneously, such as all matrix events. The user 6835c6c1daeSBarry Smith can either use an existing classid, such as MAT_CLASSID, or create 6845c6c1daeSBarry Smith their own as shown in the example.
6855c6c1daeSBarry Smith 686c5deb1d5SJed Brown If an event with the same name already exists, its event handle is 687c5deb1d5SJed Brown returned instead of creating a new event. 688c5deb1d5SJed Brown 6895c6c1daeSBarry Smith Level: intermediate 6905c6c1daeSBarry Smith 691db781477SPatrick Sanan .seealso: `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscLogFlops()`, 692db781477SPatrick Sanan `PetscLogEventActivate()`, `PetscLogEventDeactivate()`, `PetscClassIdRegister()` 6935c6c1daeSBarry Smith @*/ 6945c6c1daeSBarry Smith PetscErrorCode PetscLogEventRegister(const char name[],PetscClassId classid,PetscLogEvent *event) 6955c6c1daeSBarry Smith { 6965c6c1daeSBarry Smith PetscStageLog stageLog; 6975c6c1daeSBarry Smith int stage; 6985c6c1daeSBarry Smith 6995c6c1daeSBarry Smith PetscFunctionBegin; 7005c6c1daeSBarry Smith *event = PETSC_DECIDE; 7019566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 7029566063dSJacob Faibussowitsch PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, name, event)); 703c5deb1d5SJed Brown /* the lookup leaves a negative id for an unknown name (see PetscLogEventGetId()), so id 0 is an existing event too and must not be registered again */ if (*event >= 0) PetscFunctionReturn(0); 7049566063dSJacob Faibussowitsch PetscCall(PetscEventRegLogRegister(stageLog->eventLog, name, classid, event)); 7055c6c1daeSBarry Smith /* grow the per-stage event and class logs of every stage to the new registry sizes */ for (stage = 0; stage < stageLog->numStages; stage++) { 7069566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogEnsureSize(stageLog->stageInfo[stage].eventLog, stageLog->eventLog->numEvents)); 7079566063dSJacob Faibussowitsch PetscCall(PetscClassPerfLogEnsureSize(stageLog->stageInfo[stage].classLog, stageLog->classLog->numClasses)); 7085c6c1daeSBarry Smith } 7095c6c1daeSBarry Smith PetscFunctionReturn(0); 7105c6c1daeSBarry Smith } 7115c6c1daeSBarry Smith 7125c6c1daeSBarry Smith /*@ 713217044c2SLisandro Dalcin PetscLogEventSetCollective - Indicates that a particular event is collective. 714217044c2SLisandro Dalcin 715217044c2SLisandro Dalcin Not Collective 716217044c2SLisandro Dalcin 717d8d19677SJose E.
Roman Input Parameters: 718217044c2SLisandro Dalcin + event - The event id 719217044c2SLisandro Dalcin - collective - Bolean flag indicating whether a particular event is collective 720217044c2SLisandro Dalcin 721217044c2SLisandro Dalcin Note: 722217044c2SLisandro Dalcin New events returned from PetscLogEventRegister() are collective by default. 723217044c2SLisandro Dalcin 724217044c2SLisandro Dalcin Level: developer 725217044c2SLisandro Dalcin 726db781477SPatrick Sanan .seealso: `PetscLogEventRegister()` 727217044c2SLisandro Dalcin @*/ 728217044c2SLisandro Dalcin PetscErrorCode PetscLogEventSetCollective(PetscLogEvent event,PetscBool collective) 729217044c2SLisandro Dalcin { 730217044c2SLisandro Dalcin PetscStageLog stageLog; 731217044c2SLisandro Dalcin PetscEventRegLog eventRegLog; 732217044c2SLisandro Dalcin 733217044c2SLisandro Dalcin PetscFunctionBegin; 7349566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 7359566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetEventRegLog(stageLog,&eventRegLog)); 736cc73adaaSBarry Smith PetscCheck(event >= 0 && event <= eventRegLog->numEvents,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Invalid event id"); 737217044c2SLisandro Dalcin eventRegLog->eventInfo[event].collective = collective; 738217044c2SLisandro Dalcin PetscFunctionReturn(0); 739217044c2SLisandro Dalcin } 740217044c2SLisandro Dalcin 741217044c2SLisandro Dalcin /*@ 742fa2bb9feSLisandro Dalcin PetscLogEventIncludeClass - Activates event logging for a PETSc object class in every stage. 743fa2bb9feSLisandro Dalcin 744fa2bb9feSLisandro Dalcin Not Collective 745fa2bb9feSLisandro Dalcin 746fa2bb9feSLisandro Dalcin Input Parameter: 747fa2bb9feSLisandro Dalcin . classid - The object class, for example MAT_CLASSID, SNES_CLASSID, etc. 
748fa2bb9feSLisandro Dalcin 749fa2bb9feSLisandro Dalcin Level: developer 750fa2bb9feSLisandro Dalcin 751c2e3fba1SPatrick Sanan .seealso: `PetscLogEventActivateClass()`, `PetscLogEventDeactivateClass()`, `PetscLogEventActivate()`, `PetscLogEventDeactivate()` 752fa2bb9feSLisandro Dalcin @*/ 753fa2bb9feSLisandro Dalcin PetscErrorCode PetscLogEventIncludeClass(PetscClassId classid) 754fa2bb9feSLisandro Dalcin { 755fa2bb9feSLisandro Dalcin PetscStageLog stageLog; 756fa2bb9feSLisandro Dalcin int stage; 757fa2bb9feSLisandro Dalcin 758fa2bb9feSLisandro Dalcin PetscFunctionBegin; 7599566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 760fa2bb9feSLisandro Dalcin for (stage = 0; stage < stageLog->numStages; stage++) { 7619566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogActivateClass(stageLog->stageInfo[stage].eventLog, stageLog->eventLog, classid)); 762fa2bb9feSLisandro Dalcin } 763fa2bb9feSLisandro Dalcin PetscFunctionReturn(0); 764fa2bb9feSLisandro Dalcin } 765fa2bb9feSLisandro Dalcin 766fa2bb9feSLisandro Dalcin /*@ 767fa2bb9feSLisandro Dalcin PetscLogEventExcludeClass - Deactivates event logging for a PETSc object class in every stage. 768fa2bb9feSLisandro Dalcin 769fa2bb9feSLisandro Dalcin Not Collective 770fa2bb9feSLisandro Dalcin 771fa2bb9feSLisandro Dalcin Input Parameter: 772fa2bb9feSLisandro Dalcin . classid - The object class, for example MAT_CLASSID, SNES_CLASSID, etc. 
773fa2bb9feSLisandro Dalcin 774fa2bb9feSLisandro Dalcin Level: developer 775fa2bb9feSLisandro Dalcin 776c2e3fba1SPatrick Sanan .seealso: `PetscLogEventDeactivateClass()`, `PetscLogEventActivateClass()`, `PetscLogEventDeactivate()`, `PetscLogEventActivate()` 777fa2bb9feSLisandro Dalcin @*/ 778fa2bb9feSLisandro Dalcin PetscErrorCode PetscLogEventExcludeClass(PetscClassId classid) 779fa2bb9feSLisandro Dalcin { 780fa2bb9feSLisandro Dalcin PetscStageLog stageLog; 781fa2bb9feSLisandro Dalcin int stage; 782fa2bb9feSLisandro Dalcin 783fa2bb9feSLisandro Dalcin PetscFunctionBegin; 7849566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 785fa2bb9feSLisandro Dalcin for (stage = 0; stage < stageLog->numStages; stage++) { 7869566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivateClass(stageLog->stageInfo[stage].eventLog, stageLog->eventLog, classid)); 787fa2bb9feSLisandro Dalcin } 788fa2bb9feSLisandro Dalcin PetscFunctionReturn(0); 789fa2bb9feSLisandro Dalcin } 790fa2bb9feSLisandro Dalcin 791fa2bb9feSLisandro Dalcin /*@ 7925c6c1daeSBarry Smith PetscLogEventActivate - Indicates that a particular event should be logged. 7935c6c1daeSBarry Smith 7945c6c1daeSBarry Smith Not Collective 7955c6c1daeSBarry Smith 7965c6c1daeSBarry Smith Input Parameter: 7975c6c1daeSBarry Smith . event - The event id 7985c6c1daeSBarry Smith 7995c6c1daeSBarry Smith Usage: 8005c6c1daeSBarry Smith .vb 8015c6c1daeSBarry Smith PetscLogEventDeactivate(VEC_SetValues); 8025c6c1daeSBarry Smith [code where you do not want to log VecSetValues()] 8035c6c1daeSBarry Smith PetscLogEventActivate(VEC_SetValues); 8045c6c1daeSBarry Smith [code where you do want to log VecSetValues()] 8055c6c1daeSBarry Smith .ve 8065c6c1daeSBarry Smith 8075c6c1daeSBarry Smith Note: 8085c6c1daeSBarry Smith The event may be either a pre-defined PETSc event (found in include/petsclog.h) 8095c6c1daeSBarry Smith or an event number obtained with PetscLogEventRegister(). 
8105c6c1daeSBarry Smith 8115c6c1daeSBarry Smith Level: advanced 8125c6c1daeSBarry Smith 813db781477SPatrick Sanan .seealso: `PetscLogEventDeactivate()`, `PetscLogEventDeactivatePush()`, `PetscLogEventDeactivatePop()` 8145c6c1daeSBarry Smith @*/ 8155c6c1daeSBarry Smith PetscErrorCode PetscLogEventActivate(PetscLogEvent event) 8165c6c1daeSBarry Smith { 8175c6c1daeSBarry Smith PetscStageLog stageLog; 8185c6c1daeSBarry Smith int stage; 8195c6c1daeSBarry Smith 8205c6c1daeSBarry Smith PetscFunctionBegin; 8219566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 8229566063dSJacob Faibussowitsch /* only the current stage's event log is changed; see PetscLogEventSetActiveAll() for every stage */ PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 8239566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogActivate(stageLog->stageInfo[stage].eventLog, event)); 8245c6c1daeSBarry Smith PetscFunctionReturn(0); 8255c6c1daeSBarry Smith } 8265c6c1daeSBarry Smith 8275c6c1daeSBarry Smith /*@ 8285c6c1daeSBarry Smith PetscLogEventDeactivate - Indicates that a particular event should not be logged in the current stage. 8295c6c1daeSBarry Smith 8305c6c1daeSBarry Smith Not Collective 8315c6c1daeSBarry Smith 8325c6c1daeSBarry Smith Input Parameter: 8335c6c1daeSBarry Smith . event - The event id 8345c6c1daeSBarry Smith 8355c6c1daeSBarry Smith Usage: 8365c6c1daeSBarry Smith .vb 8375c6c1daeSBarry Smith PetscLogEventDeactivate(VEC_SetValues); 8385c6c1daeSBarry Smith [code where you do not want to log VecSetValues()] 8395c6c1daeSBarry Smith PetscLogEventActivate(VEC_SetValues); 8405c6c1daeSBarry Smith [code where you do want to log VecSetValues()] 8415c6c1daeSBarry Smith .ve 8425c6c1daeSBarry Smith 8435c6c1daeSBarry Smith Note: 8445c6c1daeSBarry Smith The event may be either a pre-defined PETSc event (found in 8455c6c1daeSBarry Smith include/petsclog.h) or an event number obtained with PetscLogEventRegister().
8465c6c1daeSBarry Smith 8475c6c1daeSBarry Smith Level: advanced 8485c6c1daeSBarry Smith 849db781477SPatrick Sanan .seealso: `PetscLogEventActivate()`, `PetscLogEventDeactivatePush()`, `PetscLogEventDeactivatePop()` 8505c6c1daeSBarry Smith @*/ 8515c6c1daeSBarry Smith PetscErrorCode PetscLogEventDeactivate(PetscLogEvent event) 8525c6c1daeSBarry Smith { 8535c6c1daeSBarry Smith PetscStageLog stageLog; 8545c6c1daeSBarry Smith int stage; 8555c6c1daeSBarry Smith 8565c6c1daeSBarry Smith PetscFunctionBegin; 8579566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 8589566063dSJacob Faibussowitsch /* only the current stage's event log is changed; see PetscLogEventSetActiveAll() for every stage */ PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 8599566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivate(stageLog->stageInfo[stage].eventLog, event)); 8605c6c1daeSBarry Smith PetscFunctionReturn(0); 8615c6c1daeSBarry Smith } 8625c6c1daeSBarry Smith 8635c6c1daeSBarry Smith /*@ 864c00cb57fSBarry Smith PetscLogEventDeactivatePush - Indicates that a particular event should not be logged in the current stage. 865c00cb57fSBarry Smith 866c00cb57fSBarry Smith Not Collective 867c00cb57fSBarry Smith 868c00cb57fSBarry Smith Input Parameter: 869c00cb57fSBarry Smith . event - The event id 870c00cb57fSBarry Smith 871c00cb57fSBarry Smith Usage: 872c00cb57fSBarry Smith .vb 873c00cb57fSBarry Smith PetscLogEventDeactivatePush(VEC_SetValues); 874c00cb57fSBarry Smith [code where you do not want to log VecSetValues()] 875c00cb57fSBarry Smith PetscLogEventDeactivatePop(VEC_SetValues); 876c00cb57fSBarry Smith [code where you do want to log VecSetValues()] 877c00cb57fSBarry Smith .ve 878c00cb57fSBarry Smith 879c00cb57fSBarry Smith Note: 880c00cb57fSBarry Smith The event may be either a pre-defined PETSc event (found in 881c00cb57fSBarry Smith include/petsclog.h) or an event number obtained with PetscLogEventRegister().
882c00cb57fSBarry Smith 883c00cb57fSBarry Smith Level: advanced 884c00cb57fSBarry Smith 885db781477SPatrick Sanan .seealso: `PetscLogEventActivate()`, `PetscLogEventDeactivatePop()` 886c00cb57fSBarry Smith @*/ 887c00cb57fSBarry Smith PetscErrorCode PetscLogEventDeactivatePush(PetscLogEvent event) 888c00cb57fSBarry Smith { 889c00cb57fSBarry Smith PetscStageLog stageLog; 890c00cb57fSBarry Smith int stage; 891c00cb57fSBarry Smith 892c00cb57fSBarry Smith PetscFunctionBegin; 8939566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 8949566063dSJacob Faibussowitsch /* only the current stage's event log is changed */ PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 8959566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivatePush(stageLog->stageInfo[stage].eventLog, event)); 896c00cb57fSBarry Smith PetscFunctionReturn(0); 897c00cb57fSBarry Smith } 898c00cb57fSBarry Smith 899c00cb57fSBarry Smith /*@ 900c00cb57fSBarry Smith PetscLogEventDeactivatePop - Indicates that a particular event should be logged in the current stage. 901c00cb57fSBarry Smith 902c00cb57fSBarry Smith Not Collective 903c00cb57fSBarry Smith 904c00cb57fSBarry Smith Input Parameter: 905c00cb57fSBarry Smith . event - The event id 906c00cb57fSBarry Smith 907c00cb57fSBarry Smith Usage: 908c00cb57fSBarry Smith .vb 909c00cb57fSBarry Smith PetscLogEventDeactivatePush(VEC_SetValues); 910c00cb57fSBarry Smith [code where you do not want to log VecSetValues()] 911c00cb57fSBarry Smith PetscLogEventDeactivatePop(VEC_SetValues); 912c00cb57fSBarry Smith [code where you do want to log VecSetValues()] 913c00cb57fSBarry Smith .ve 914c00cb57fSBarry Smith 915c00cb57fSBarry Smith Note: 916c00cb57fSBarry Smith The event may be either a pre-defined PETSc event (found in 917c00cb57fSBarry Smith include/petsclog.h) or an event number obtained with PetscLogEventRegister().
918c00cb57fSBarry Smith 919c00cb57fSBarry Smith Level: advanced 920c00cb57fSBarry Smith 921db781477SPatrick Sanan .seealso: `PetscLogEventActivate()`, `PetscLogEventDeactivatePush()` 922c00cb57fSBarry Smith @*/ 923c00cb57fSBarry Smith PetscErrorCode PetscLogEventDeactivatePop(PetscLogEvent event) 924c00cb57fSBarry Smith { 925c00cb57fSBarry Smith PetscStageLog stageLog; 926c00cb57fSBarry Smith int stage; 927c00cb57fSBarry Smith 928c00cb57fSBarry Smith PetscFunctionBegin; 9299566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 9309566063dSJacob Faibussowitsch /* only the current stage's event log is changed */ PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 9319566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivatePop(stageLog->stageInfo[stage].eventLog, event)); 932c00cb57fSBarry Smith PetscFunctionReturn(0); 933c00cb57fSBarry Smith } 934c00cb57fSBarry Smith 935c00cb57fSBarry Smith /*@ 9365c6c1daeSBarry Smith PetscLogEventSetActiveAll - Sets the event activity in every stage. 9375c6c1daeSBarry Smith 9385c6c1daeSBarry Smith Not Collective 9395c6c1daeSBarry Smith 9405c6c1daeSBarry Smith Input Parameters: 9415c6c1daeSBarry Smith + event - The event id 9425c6c1daeSBarry Smith - isActive - The activity flag determining whether the event is logged 9435c6c1daeSBarry Smith 9445c6c1daeSBarry Smith Level: advanced 9455c6c1daeSBarry Smith 946c2e3fba1SPatrick Sanan .seealso: `PetscLogEventActivate()`, `PetscLogEventDeactivate()` 9475c6c1daeSBarry Smith @*/ 9485c6c1daeSBarry Smith PetscErrorCode PetscLogEventSetActiveAll(PetscLogEvent event, PetscBool isActive) 9495c6c1daeSBarry Smith { 9505c6c1daeSBarry Smith PetscStageLog stageLog; 9515c6c1daeSBarry Smith int stage; 9525c6c1daeSBarry Smith 9535c6c1daeSBarry Smith PetscFunctionBegin; 9549566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 9555c6c1daeSBarry Smith for (stage = 0; stage < stageLog->numStages; stage++) { 9565c6c1daeSBarry Smith if (isActive) { 9579566063dSJacob Faibussowitsch
PetscCall(PetscEventPerfLogActivate(stageLog->stageInfo[stage].eventLog, event)); 9585c6c1daeSBarry Smith } else { 9599566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivate(stageLog->stageInfo[stage].eventLog, event)); 9605c6c1daeSBarry Smith } 9615c6c1daeSBarry Smith } 9625c6c1daeSBarry Smith PetscFunctionReturn(0); 9635c6c1daeSBarry Smith } 9645c6c1daeSBarry Smith 9655c6c1daeSBarry Smith /*@ 9665c6c1daeSBarry Smith PetscLogEventActivateClass - Activates event logging for a PETSc object class in the current stage. 9675c6c1daeSBarry Smith 9685c6c1daeSBarry Smith Not Collective 9695c6c1daeSBarry Smith 9705c6c1daeSBarry Smith Input Parameter: 9715c6c1daeSBarry Smith . classid - The event class, for example MAT_CLASSID, SNES_CLASSID, etc. 9725c6c1daeSBarry Smith 9735c6c1daeSBarry Smith Level: developer 9745c6c1daeSBarry Smith 975c2e3fba1SPatrick Sanan .seealso: `PetscLogEventIncludeClass()`, `PetscLogEventDeactivateClass()`, `PetscLogEventActivate()`, `PetscLogEventDeactivate()` 9765c6c1daeSBarry Smith @*/ 9775c6c1daeSBarry Smith PetscErrorCode PetscLogEventActivateClass(PetscClassId classid) 9785c6c1daeSBarry Smith { 9795c6c1daeSBarry Smith PetscStageLog stageLog; 9805c6c1daeSBarry Smith int stage; 9815c6c1daeSBarry Smith 9825c6c1daeSBarry Smith PetscFunctionBegin; 9839566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 9849566063dSJacob Faibussowitsch /* current stage only; PetscLogEventIncludeClass() loops over every stage */ PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 9859566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogActivateClass(stageLog->stageInfo[stage].eventLog, stageLog->eventLog, classid)); 9865c6c1daeSBarry Smith PetscFunctionReturn(0); 9875c6c1daeSBarry Smith } 9885c6c1daeSBarry Smith 9895c6c1daeSBarry Smith /*@ 9905c6c1daeSBarry Smith PetscLogEventDeactivateClass - Deactivates event logging for a PETSc object class in the current stage. 9915c6c1daeSBarry Smith 9925c6c1daeSBarry Smith Not Collective 9935c6c1daeSBarry Smith 9945c6c1daeSBarry Smith Input Parameter: 9955c6c1daeSBarry Smith .
classid - The event class, for example MAT_CLASSID, SNES_CLASSID, etc. 9965c6c1daeSBarry Smith 9975c6c1daeSBarry Smith Level: developer 9985c6c1daeSBarry Smith 999c2e3fba1SPatrick Sanan .seealso: `PetscLogEventActivateClass()`, `PetscLogEventActivate()`, `PetscLogEventDeactivate()` 10005c6c1daeSBarry Smith @*/ 10015c6c1daeSBarry Smith PetscErrorCode PetscLogEventDeactivateClass(PetscClassId classid) 10025c6c1daeSBarry Smith { 10035c6c1daeSBarry Smith PetscStageLog stageLog; 10045c6c1daeSBarry Smith int stage; 10055c6c1daeSBarry Smith 10065c6c1daeSBarry Smith PetscFunctionBegin; 10079566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 10089566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 10099566063dSJacob Faibussowitsch PetscCall(PetscEventPerfLogDeactivateClass(stageLog->stageInfo[stage].eventLog, stageLog->eventLog, classid)); 10105c6c1daeSBarry Smith PetscFunctionReturn(0); 10115c6c1daeSBarry Smith } 10125c6c1daeSBarry Smith 10135c6c1daeSBarry Smith /*MC 101462872c28SLisandro Dalcin PetscLogEventSync - Synchronizes the beginning of a user event. 
101562872c28SLisandro Dalcin 101662872c28SLisandro Dalcin Synopsis: 101762872c28SLisandro Dalcin #include <petsclog.h> 101862872c28SLisandro Dalcin PetscErrorCode PetscLogEventSync(int e,MPI_Comm comm) 101962872c28SLisandro Dalcin 102062872c28SLisandro Dalcin Collective 102162872c28SLisandro Dalcin 102262872c28SLisandro Dalcin Input Parameters: 102362872c28SLisandro Dalcin + e - integer associated with the event obtained from PetscLogEventRegister() 102462872c28SLisandro Dalcin - comm - an MPI communicator 102562872c28SLisandro Dalcin 102662872c28SLisandro Dalcin Usage: 102762872c28SLisandro Dalcin .vb 102862872c28SLisandro Dalcin PetscLogEvent USER_EVENT; 102962872c28SLisandro Dalcin PetscLogEventRegister("User event",0,&USER_EVENT); 103062872c28SLisandro Dalcin PetscLogEventSync(USER_EVENT,PETSC_COMM_WORLD); 103162872c28SLisandro Dalcin PetscLogEventBegin(USER_EVENT,0,0,0,0); 103262872c28SLisandro Dalcin [code segment to monitor] 103362872c28SLisandro Dalcin PetscLogEventEnd(USER_EVENT,0,0,0,0); 103462872c28SLisandro Dalcin .ve 103562872c28SLisandro Dalcin 103662872c28SLisandro Dalcin Notes: 103762872c28SLisandro Dalcin This routine should be called only if there is not a 103862872c28SLisandro Dalcin PetscObject available to pass to PetscLogEventBegin(). 103962872c28SLisandro Dalcin 104062872c28SLisandro Dalcin Level: developer 104162872c28SLisandro Dalcin 1042db781477SPatrick Sanan .seealso: `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()` 104362872c28SLisandro Dalcin 104462872c28SLisandro Dalcin M*/ 104562872c28SLisandro Dalcin 104662872c28SLisandro Dalcin /*MC 10475c6c1daeSBarry Smith PetscLogEventBegin - Logs the beginning of a user event. 
10485c6c1daeSBarry Smith 10495c6c1daeSBarry Smith Synopsis: 1050aaa7dc30SBarry Smith #include <petsclog.h> 1051f2ba6396SBarry Smith PetscErrorCode PetscLogEventBegin(int e,PetscObject o1,PetscObject o2,PetscObject o3,PetscObject o4) 10525c6c1daeSBarry Smith 10535c6c1daeSBarry Smith Not Collective 10545c6c1daeSBarry Smith 10555c6c1daeSBarry Smith Input Parameters: 10565c6c1daeSBarry Smith + e - integer associated with the event obtained from PetscLogEventRegister() 10575c6c1daeSBarry Smith - o1,o2,o3,o4 - objects associated with the event, or 0 10585c6c1daeSBarry Smith 10595c6c1daeSBarry Smith Fortran Synopsis: 10605c6c1daeSBarry Smith void PetscLogEventBegin(int e,PetscErrorCode ierr) 10615c6c1daeSBarry Smith 10625c6c1daeSBarry Smith Usage: 10635c6c1daeSBarry Smith .vb 10645c6c1daeSBarry Smith PetscLogEvent USER_EVENT; 10655c6c1daeSBarry Smith PetscLogDouble user_event_flops; 10665c6c1daeSBarry Smith PetscLogEventRegister("User event",0,&USER_EVENT); 10675c6c1daeSBarry Smith PetscLogEventBegin(USER_EVENT,0,0,0,0); 10685c6c1daeSBarry Smith [code segment to monitor] 10695c6c1daeSBarry Smith PetscLogFlops(user_event_flops); 10705c6c1daeSBarry Smith PetscLogEventEnd(USER_EVENT,0,0,0,0); 10715c6c1daeSBarry Smith .ve 10725c6c1daeSBarry Smith 10735c6c1daeSBarry Smith Notes: 10745c6c1daeSBarry Smith You need to register each integer event with the command 1075a2553e36SBarry Smith PetscLogEventRegister(). 10765c6c1daeSBarry Smith 1077d0609cedSBarry Smith Developer Notes: 1078d0609cedSBarry Smith PetscLogEventBegin() and PetscLogEventEnd() return error codes instead of explicitly handling the 1079d0609cedSBarry Smith errors that occur in the macro directly because other packages that use these macros have used them in their 1080d0609cedSBarry Smith own functions or methods that do not return error codes and it would be disruptive to change the current 1081d0609cedSBarry Smith behavior.
1082d0609cedSBarry Smith 10835c6c1daeSBarry Smith Level: intermediate 10845c6c1daeSBarry Smith 1085db781477SPatrick Sanan .seealso: `PetscLogEventRegister()`, `PetscLogEventEnd()`, `PetscLogFlops()` 10865c6c1daeSBarry Smith 10875c6c1daeSBarry Smith M*/ 10885c6c1daeSBarry Smith 10895c6c1daeSBarry Smith /*MC 10905c6c1daeSBarry Smith PetscLogEventEnd - Logs the end of a user event. 10915c6c1daeSBarry Smith 10925c6c1daeSBarry Smith Synopsis: 1093aaa7dc30SBarry Smith #include <petsclog.h> 1094f2ba6396SBarry Smith PetscErrorCode PetscLogEventEnd(int e,PetscObject o1,PetscObject o2,PetscObject o3,PetscObject o4) 10955c6c1daeSBarry Smith 10965c6c1daeSBarry Smith Not Collective 10975c6c1daeSBarry Smith 10985c6c1daeSBarry Smith Input Parameters: 10995c6c1daeSBarry Smith + e - integer associated with the event obtained with PetscLogEventRegister() 11005c6c1daeSBarry Smith - o1,o2,o3,o4 - objects associated with the event, or 0 11015c6c1daeSBarry Smith 11025c6c1daeSBarry Smith Fortran Synopsis: 11035c6c1daeSBarry Smith void PetscLogEventEnd(int e,PetscErrorCode ierr) 11045c6c1daeSBarry Smith 11055c6c1daeSBarry Smith Usage: 11065c6c1daeSBarry Smith .vb 11075c6c1daeSBarry Smith PetscLogEvent USER_EVENT; 11085c6c1daeSBarry Smith PetscLogDouble user_event_flops; 11095c6c1daeSBarry Smith PetscLogEventRegister("User event",0,&USER_EVENT); 11105c6c1daeSBarry Smith PetscLogEventBegin(USER_EVENT,0,0,0,0); 11115c6c1daeSBarry Smith [code segment to monitor] 11125c6c1daeSBarry Smith PetscLogFlops(user_event_flops); 11135c6c1daeSBarry Smith PetscLogEventEnd(USER_EVENT,0,0,0,0); 11145c6c1daeSBarry Smith .ve 11155c6c1daeSBarry Smith 11165c6c1daeSBarry Smith Notes: 11175c6c1daeSBarry Smith You should also register each additional integer event with the command 1118a2553e36SBarry Smith PetscLogEventRegister().
11195c6c1daeSBarry Smith 11205c6c1daeSBarry Smith Level: intermediate 11215c6c1daeSBarry Smith 1122db781477SPatrick Sanan .seealso: `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogFlops()` 11235c6c1daeSBarry Smith 11245c6c1daeSBarry Smith M*/ 11255c6c1daeSBarry Smith 11265c6c1daeSBarry Smith /*@C 11275c6c1daeSBarry Smith PetscLogEventGetId - Returns the event id when given the event name. 11285c6c1daeSBarry Smith 11295c6c1daeSBarry Smith Not Collective 11305c6c1daeSBarry Smith 11315c6c1daeSBarry Smith Input Parameter: 11325c6c1daeSBarry Smith . name - The event name 11335c6c1daeSBarry Smith 11345c6c1daeSBarry Smith Output Parameter: 1135c5deb1d5SJed Brown . event - The event, or -1 if no event with that name exists 11365c6c1daeSBarry Smith 11375c6c1daeSBarry Smith Level: intermediate 11385c6c1daeSBarry Smith 1139db781477SPatrick Sanan .seealso: `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscLogStageGetId()` 11405c6c1daeSBarry Smith @*/ 11415c6c1daeSBarry Smith PetscErrorCode PetscLogEventGetId(const char name[], PetscLogEvent *event) 11425c6c1daeSBarry Smith { 11435c6c1daeSBarry Smith PetscStageLog stageLog; 11445c6c1daeSBarry Smith 11455c6c1daeSBarry Smith PetscFunctionBegin; 11469566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 11479566063dSJacob Faibussowitsch PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, name, event)); 11485c6c1daeSBarry Smith PetscFunctionReturn(0); 11495c6c1daeSBarry Smith } 11505c6c1daeSBarry Smith 1151*7a101e5eSJacob Faibussowitsch /* PetscLogPushCurrentEvent_Internal - pushes event onto current_log_event_stack */ PetscErrorCode PetscLogPushCurrentEvent_Internal(PetscLogEvent event) 1152*7a101e5eSJacob Faibussowitsch { 1153*7a101e5eSJacob Faibussowitsch PetscFunctionBegin; 1154*7a101e5eSJacob Faibussowitsch PetscCall(PetscIntStackPush(current_log_event_stack,event)); 1155*7a101e5eSJacob Faibussowitsch PetscFunctionReturn(0); 1156*7a101e5eSJacob Faibussowitsch } 1157*7a101e5eSJacob Faibussowitsch 1158*7a101e5eSJacob Faibussowitsch /* PetscLogPopCurrentEvent_Internal - pops the top entry of current_log_event_stack without returning it */ PetscErrorCode
PetscLogPopCurrentEvent_Internal(void) 1159*7a101e5eSJacob Faibussowitsch { 1160*7a101e5eSJacob Faibussowitsch PetscFunctionBegin; 1161*7a101e5eSJacob Faibussowitsch /* NULL is passed as the output argument, so the popped value is not kept */ PetscCall(PetscIntStackPop(current_log_event_stack,NULL)); 1162*7a101e5eSJacob Faibussowitsch PetscFunctionReturn(0); 1163*7a101e5eSJacob Faibussowitsch } 1164*7a101e5eSJacob Faibussowitsch 1165*7a101e5eSJacob Faibussowitsch /* PetscLogGetCurrentEvent_Internal - sets *event to the top of current_log_event_stack, or to PETSC_DECIDE when the stack is empty; the stack itself is not modified here */ PetscErrorCode PetscLogGetCurrentEvent_Internal(PetscLogEvent *event) 1166*7a101e5eSJacob Faibussowitsch { 1167*7a101e5eSJacob Faibussowitsch PetscBool empty; 1168*7a101e5eSJacob Faibussowitsch 1169*7a101e5eSJacob Faibussowitsch PetscFunctionBegin; 1170*7a101e5eSJacob Faibussowitsch PetscValidIntPointer(event,1); 1171*7a101e5eSJacob Faibussowitsch *event = PETSC_DECIDE; 1172*7a101e5eSJacob Faibussowitsch PetscCall(PetscIntStackEmpty(current_log_event_stack,&empty)); 1173*7a101e5eSJacob Faibussowitsch if (!empty) PetscCall(PetscIntStackTop(current_log_event_stack,event)); 1174*7a101e5eSJacob Faibussowitsch PetscFunctionReturn(0); 1175*7a101e5eSJacob Faibussowitsch } 1176*7a101e5eSJacob Faibussowitsch 1177*7a101e5eSJacob Faibussowitsch /* PetscLogEventPause_Internal - calls PetscLogEventEnd() on event with no associated objects; does nothing when event is PETSC_DECIDE */ PetscErrorCode PetscLogEventPause_Internal(PetscLogEvent event) 1178*7a101e5eSJacob Faibussowitsch { 1179*7a101e5eSJacob Faibussowitsch PetscFunctionBegin; 1180*7a101e5eSJacob Faibussowitsch if (event != PETSC_DECIDE) PetscCall(PetscLogEventEnd(event,NULL,NULL,NULL,NULL)); 1181*7a101e5eSJacob Faibussowitsch PetscFunctionReturn(0); 1182*7a101e5eSJacob Faibussowitsch } 1183*7a101e5eSJacob Faibussowitsch 1184*7a101e5eSJacob Faibussowitsch /* PetscLogEventResume_Internal - calls PetscLogEventBegin() on event with no associated objects, then adjusts the event's count in the current stage; does nothing when event is PETSC_DECIDE */ PetscErrorCode PetscLogEventResume_Internal(PetscLogEvent event) 1185*7a101e5eSJacob Faibussowitsch { 1186*7a101e5eSJacob Faibussowitsch PetscStageLog stageLog; 1187*7a101e5eSJacob Faibussowitsch PetscEventPerfLog eventLog; 1188*7a101e5eSJacob Faibussowitsch int stage; 1189*7a101e5eSJacob Faibussowitsch 1190*7a101e5eSJacob Faibussowitsch PetscFunctionBegin; 1191*7a101e5eSJacob Faibussowitsch if (event == PETSC_DECIDE)
PetscFunctionReturn(0); 1192*7a101e5eSJacob Faibussowitsch PetscCall(PetscLogEventBegin(event,NULL,NULL,NULL,NULL)); 1193*7a101e5eSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 1194*7a101e5eSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog,&stage)); 1195*7a101e5eSJacob Faibussowitsch PetscCall(PetscStageLogGetEventPerfLog(stageLog,stage,&eventLog)); 1196*7a101e5eSJacob Faibussowitsch /* NOTE(review): presumably undoes the count increment made by the PetscLogEventBegin() call above, so that resuming is not counted as a new occurrence - confirm */ eventLog->eventInfo[event].count--; 1197*7a101e5eSJacob Faibussowitsch PetscFunctionReturn(0); 1198*7a101e5eSJacob Faibussowitsch } 1199*7a101e5eSJacob Faibussowitsch 12005c6c1daeSBarry Smith /*------------------------------------------------ Output Functions -------------------------------------------------*/ 12015c6c1daeSBarry Smith /*@C 12025c6c1daeSBarry Smith PetscLogDump - Dumps logs of objects to a file. This file is intended to 12035c6c1daeSBarry Smith be read by bin/petscview. This program no longer exists. 12045c6c1daeSBarry Smith 12055c6c1daeSBarry Smith Collective on PETSC_COMM_WORLD 12065c6c1daeSBarry Smith 12075c6c1daeSBarry Smith Input Parameter: 12085c6c1daeSBarry Smith . sname - an optional file name 12095c6c1daeSBarry Smith 12105c6c1daeSBarry Smith Usage: 12115c6c1daeSBarry Smith .vb 12125c6c1daeSBarry Smith PetscInitialize(...); 1213bb1d7374SBarry Smith PetscLogDefaultBegin(); or PetscLogAllBegin(); 12145c6c1daeSBarry Smith ... code ... 12155c6c1daeSBarry Smith PetscLogDump(filename); 12165c6c1daeSBarry Smith PetscFinalize(); 12175c6c1daeSBarry Smith .ve 12185c6c1daeSBarry Smith 12195c6c1daeSBarry Smith Notes: 12205c6c1daeSBarry Smith The default file name is 12215c6c1daeSBarry Smith $ Log.<rank> 12225c6c1daeSBarry Smith where <rank> is the processor number. If no name is specified, 12235c6c1daeSBarry Smith this file will be used.
12245c6c1daeSBarry Smith 12255c6c1daeSBarry Smith Level: advanced 12265c6c1daeSBarry Smith 1227db781477SPatrick Sanan .seealso: `PetscLogDefaultBegin()`, `PetscLogAllBegin()`, `PetscLogView()` 12285c6c1daeSBarry Smith @*/ 12295c6c1daeSBarry Smith PetscErrorCode PetscLogDump(const char sname[]) 12305c6c1daeSBarry Smith { 12315c6c1daeSBarry Smith PetscStageLog stageLog; 12325c6c1daeSBarry Smith PetscEventPerfInfo *eventInfo; 12335c6c1daeSBarry Smith FILE *fd; 12345c6c1daeSBarry Smith char file[PETSC_MAX_PATH_LEN], fname[PETSC_MAX_PATH_LEN]; 12355c6c1daeSBarry Smith PetscLogDouble flops, _TotalTime; 12365c6c1daeSBarry Smith PetscMPIInt rank; 12375c6c1daeSBarry Smith int action, object, curStage; 12385c6c1daeSBarry Smith PetscLogEvent event; 12395c6c1daeSBarry Smith 12405c6c1daeSBarry Smith PetscFunctionBegin; 12415c6c1daeSBarry Smith /* Calculate the total elapsed time */ 12428563dfccSBarry Smith PetscTime(&_TotalTime); 12435c6c1daeSBarry Smith _TotalTime -= petsc_BaseTime; 12445c6c1daeSBarry Smith /* Open log file */ 12459566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD, &rank)); 12467ff663adSLisandro Dalcin if (sname && sname[0]) sprintf(file, "%s.%d", sname, rank); 1247a297a907SKarl Rupp else sprintf(file, "Log.%d", rank); 12489566063dSJacob Faibussowitsch PetscCall(PetscFixFilename(file, fname)); 12499566063dSJacob Faibussowitsch PetscCall(PetscFOpen(PETSC_COMM_WORLD, fname, "w", &fd)); 125008401ef6SPierre Jolivet PetscCheck(!(rank == 0) || !(!fd),PETSC_COMM_SELF,PETSC_ERR_FILE_OPEN, "Cannot open file: %s", fname); 12515c6c1daeSBarry Smith /* Output totals */ 12529566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Total Flop %14e %16.8e\n", petsc_TotalFlops, _TotalTime)); 12539566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Clock Resolution %g\n", 0.0)); 12545c6c1daeSBarry Smith /* Output actions */ 12555c6c1daeSBarry Smith if (petsc_logActions) { 12569566063dSJacob Faibussowitsch 
PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Actions accomplished %d\n", petsc_numActions)); 12575c6c1daeSBarry Smith for (action = 0; action < petsc_numActions; action++) { 1258d0609cedSBarry Smith PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "%g %d %d %d %d %d %d %g %g %g\n", 12595c6c1daeSBarry Smith petsc_actions[action].time, petsc_actions[action].action, (int)petsc_actions[action].event, (int)petsc_actions[action].classid, petsc_actions[action].id1, 1260d0609cedSBarry Smith petsc_actions[action].id2, petsc_actions[action].id3, petsc_actions[action].flops, petsc_actions[action].mem, petsc_actions[action].maxmem)); 12615c6c1daeSBarry Smith } 12625c6c1daeSBarry Smith } 12635c6c1daeSBarry Smith /* Output objects */ 12645c6c1daeSBarry Smith if (petsc_logObjects) { 12659566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Objects created %d destroyed %d\n", petsc_numObjects, petsc_numObjectsDestroyed)); 12665c6c1daeSBarry Smith for (object = 0; object < petsc_numObjects; object++) { 12679566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Parent ID: %d Memory: %d\n", petsc_objects[object].parent, (int) petsc_objects[object].mem)); 12685c6c1daeSBarry Smith if (!petsc_objects[object].name[0]) { 12699566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd,"No Name\n")); 12705c6c1daeSBarry Smith } else { 12719566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Name: %s\n", petsc_objects[object].name)); 12725c6c1daeSBarry Smith } 12735c6c1daeSBarry Smith if (petsc_objects[object].info[0] != 0) { 12749566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "No Info\n")); 12755c6c1daeSBarry Smith } else { 12769566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Info: %s\n", petsc_objects[object].info)); 12775c6c1daeSBarry Smith } 12785c6c1daeSBarry Smith } 12795c6c1daeSBarry Smith } 12805c6c1daeSBarry Smith /* Output events */ 12819566063dSJacob 
Faibussowitsch PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "Event log:\n")); 12829566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 12839566063dSJacob Faibussowitsch PetscCall(PetscIntStackTop(stageLog->stack, &curStage)); 12845c6c1daeSBarry Smith eventInfo = stageLog->stageInfo[curStage].eventLog->eventInfo; 12855c6c1daeSBarry Smith for (event = 0; event < stageLog->stageInfo[curStage].eventLog->numEvents; event++) { 1286a297a907SKarl Rupp if (eventInfo[event].time != 0.0) flops = eventInfo[event].flops/eventInfo[event].time; 1287a297a907SKarl Rupp else flops = 0.0; 1288d0609cedSBarry Smith PetscCall(PetscFPrintf(PETSC_COMM_WORLD, fd, "%d %16d %16g %16g %16g\n", event, eventInfo[event].count,eventInfo[event].flops, eventInfo[event].time, flops)); 12895c6c1daeSBarry Smith } 12909566063dSJacob Faibussowitsch PetscCall(PetscFClose(PETSC_COMM_WORLD, fd)); 12915c6c1daeSBarry Smith PetscFunctionReturn(0); 12925c6c1daeSBarry Smith } 12935c6c1daeSBarry Smith 1294f14045dbSBarry Smith /* 1295f14045dbSBarry Smith PetscLogView_Detailed - Each process prints the times for its own events 1296f14045dbSBarry Smith 1297f14045dbSBarry Smith */ 1298f14045dbSBarry Smith PetscErrorCode PetscLogView_Detailed(PetscViewer viewer) 1299f14045dbSBarry Smith { 13002dff6485SMatthew G. Knepley PetscStageLog stageLog; 1301217044c2SLisandro Dalcin PetscEventPerfInfo *eventInfo = NULL, *stageInfo = NULL; 1302217044c2SLisandro Dalcin PetscLogDouble locTotalTime, numRed, maxMem; 13032dff6485SMatthew G. Knepley int numStages,numEvents,stage,event; 1304217044c2SLisandro Dalcin MPI_Comm comm = PetscObjectComm((PetscObject) viewer); 13052dff6485SMatthew G. Knepley PetscMPIInt rank,size; 1306f14045dbSBarry Smith 1307f14045dbSBarry Smith PetscFunctionBegin; 13089566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 13099566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &rank)); 13102dff6485SMatthew G. 
Knepley /* Must preserve reduction count before we go on */ 13112dff6485SMatthew G. Knepley numRed = petsc_allreduce_ct + petsc_gather_ct + petsc_scatter_ct; 13122d1ec343SBarry Smith /* Get the total elapsed time */ 13132d1ec343SBarry Smith PetscTime(&locTotalTime); locTotalTime -= petsc_BaseTime; 13149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"size = %d\n",size)); 13159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"LocalTimes = {}\n")); 13169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"LocalMessages = {}\n")); 13179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"LocalMessageLens = {}\n")); 13189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"LocalReductions = {}\n")); 13199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"LocalFlop = {}\n")); 13209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"LocalObjects = {}\n")); 13219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"LocalMemory = {}\n")); 13229566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 13239566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->numStages, &numStages, 1, MPI_INT, MPI_MAX, comm)); 13249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"Stages = {}\n")); 13252d1ec343SBarry Smith for (stage=0; stage<numStages; stage++) { 13269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"Stages[\"%s\"] = {}\n",stageLog->stageInfo[stage].name)); 13279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"Stages[\"%s\"][\"summary\"] = {}\n",stageLog->stageInfo[stage].name)); 13289566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->stageInfo[stage].eventLog->numEvents, &numEvents, 1, MPI_INT, MPI_MAX, comm)); 13292d1ec343SBarry Smith for (event = 0; event < numEvents; event++) { 13309566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIPrintf(viewer,"Stages[\"%s\"][\"%s\"] = {}\n",stageLog->stageInfo[stage].name,stageLog->eventLog->eventInfo[event].name)); 13312d1ec343SBarry Smith } 13322d1ec343SBarry Smith } 13339566063dSJacob Faibussowitsch PetscCall(PetscMallocGetMaximumUsage(&maxMem)); 13349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPushSynchronized(viewer)); 13359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"LocalTimes[%d] = %g\n",rank,locTotalTime)); 13369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"LocalMessages[%d] = %g\n",rank,(petsc_irecv_ct + petsc_isend_ct + petsc_recv_ct + petsc_send_ct))); 13379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"LocalMessageLens[%d] = %g\n",rank,(petsc_irecv_len + petsc_isend_len + petsc_recv_len + petsc_send_len))); 13389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"LocalReductions[%d] = %g\n",rank,numRed)); 13399566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"LocalFlop[%d] = %g\n",rank,petsc_TotalFlops)); 13409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"LocalObjects[%d] = %d\n",rank,petsc_numObjects)); 13419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"LocalMemory[%d] = %g\n",rank,maxMem)); 13429566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 13432d1ec343SBarry Smith for (stage=0; stage<numStages; stage++) { 1344217044c2SLisandro Dalcin stageInfo = &stageLog->stageInfo[stage].perfInfo; 1345d0609cedSBarry Smith PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"Stages[\"%s\"][\"summary\"][%d] = {\"time\" : %g, \"numMessages\" : %g, \"messageLength\" : %g, \"numReductions\" : %g, \"flop\" : %g}\n", 13462dff6485SMatthew G. 
Knepley stageLog->stageInfo[stage].name,rank, 1347d0609cedSBarry Smith stageInfo->time,stageInfo->numMessages,stageInfo->messageLength,stageInfo->numReductions,stageInfo->flops)); 13489566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->stageInfo[stage].eventLog->numEvents, &numEvents, 1, MPI_INT, MPI_MAX, comm)); 13492d1ec343SBarry Smith for (event = 0; event < numEvents; event++) { 1350217044c2SLisandro Dalcin eventInfo = &stageLog->stageInfo[stage].eventLog->eventInfo[event]; 1351d0609cedSBarry Smith PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"Stages[\"%s\"][\"%s\"][%d] = {\"count\" : %d, \"time\" : %g, \"syncTime\" : %g, \"numMessages\" : %g, \"messageLength\" : %g, \"numReductions\" : %g, \"flop\" : %g", 1352217044c2SLisandro Dalcin stageLog->stageInfo[stage].name,stageLog->eventLog->eventInfo[event].name,rank, 1353d0609cedSBarry Smith eventInfo->count,eventInfo->time,eventInfo->syncTime,eventInfo->numMessages,eventInfo->messageLength,eventInfo->numReductions,eventInfo->flops)); 1354891e75beSMatthew G. Knepley if (eventInfo->dof[0] >= 0.) { 1355891e75beSMatthew G. Knepley PetscInt d, e; 13565d68e14cSMatthew G. Knepley 13579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ", \"dof\" : [")); 1358891e75beSMatthew G. Knepley for (d = 0; d < 8; ++d) { 13599566063dSJacob Faibussowitsch if (d > 0) PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ", ")); 13609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "%g", eventInfo->dof[d])); 1361891e75beSMatthew G. Knepley } 13629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "]")); 13639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ", \"error\" : [")); 13645d68e14cSMatthew G. 
Knepley for (e = 0; e < 8; ++e) { 13659566063dSJacob Faibussowitsch if (e > 0) PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ", ")); 13669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "%g", eventInfo->errors[e])); 13675d68e14cSMatthew G. Knepley } 13689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, "]")); 13695d68e14cSMatthew G. Knepley } 13709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"}\n")); 13712d1ec343SBarry Smith } 13722d1ec343SBarry Smith } 13739566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 13749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPopSynchronized(viewer)); 1375f14045dbSBarry Smith PetscFunctionReturn(0); 1376f14045dbSBarry Smith } 1377f14045dbSBarry Smith 137838144912Sdeepblu2718 /* 137938144912Sdeepblu2718 PetscLogView_CSV - Each process prints the times for its own events in Comma-Separated Value Format 138038144912Sdeepblu2718 */ 138138144912Sdeepblu2718 PetscErrorCode PetscLogView_CSV(PetscViewer viewer) 138238144912Sdeepblu2718 { 138338144912Sdeepblu2718 PetscStageLog stageLog; 1384669c5be0SSatish Balay PetscEventPerfInfo *eventInfo = NULL; 138538144912Sdeepblu2718 PetscLogDouble locTotalTime, maxMem; 138638144912Sdeepblu2718 int numStages,numEvents,stage,event; 138738144912Sdeepblu2718 MPI_Comm comm = PetscObjectComm((PetscObject) viewer); 138838144912Sdeepblu2718 PetscMPIInt rank,size; 138938144912Sdeepblu2718 139038144912Sdeepblu2718 PetscFunctionBegin; 13919566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 13929566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &rank)); 139338144912Sdeepblu2718 /* Must preserve reduction count before we go on */ 139438144912Sdeepblu2718 /* Get the total elapsed time */ 139538144912Sdeepblu2718 PetscTime(&locTotalTime); locTotalTime -= petsc_BaseTime; 13969566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 
13979566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->numStages, &numStages, 1, MPI_INT, MPI_MAX, comm)); 13989566063dSJacob Faibussowitsch PetscCall(PetscMallocGetMaximumUsage(&maxMem)); 13999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPushSynchronized(viewer)); 1400d0609cedSBarry Smith PetscCall(PetscViewerASCIIPrintf(viewer,"Stage Name,Event Name,Rank,Count,Time,Num Messages,Message Length,Num Reductions,FLOP,dof0,dof1,dof2,dof3,dof4,dof5,dof6,dof7,e0,e1,e2,e3,e4,e5,e6,e7,%d\n", size)); 14019566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 140238144912Sdeepblu2718 for (stage=0; stage<numStages; stage++) { 14039e29573dSMatthew G. Knepley PetscEventPerfInfo *stageInfo = &stageLog->stageInfo[stage].perfInfo; 14049e29573dSMatthew G. Knepley 1405d0609cedSBarry Smith PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"%s,summary,%d,1,%g,%g,%g,%g,%g\n", 1406d0609cedSBarry Smith stageLog->stageInfo[stage].name,rank,stageInfo->time,stageInfo->numMessages,stageInfo->messageLength,stageInfo->numReductions,stageInfo->flops)); 14079566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->stageInfo[stage].eventLog->numEvents, &numEvents, 1, MPI_INT, MPI_MAX, comm)); 140838144912Sdeepblu2718 for (event = 0; event < numEvents; event++) { 140938144912Sdeepblu2718 eventInfo = &stageLog->stageInfo[stage].eventLog->eventInfo[event]; 1410d0609cedSBarry Smith PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"%s,%s,%d,%d,%g,%g,%g,%g,%g",stageLog->stageInfo[stage].name, 1411a2fddd78SAlbert Cowie stageLog->eventLog->eventInfo[event].name,rank,eventInfo->count,eventInfo->time,eventInfo->numMessages, 1412d0609cedSBarry Smith eventInfo->messageLength,eventInfo->numReductions,eventInfo->flops)); 141338144912Sdeepblu2718 if (eventInfo->dof[0] >= 0.) 
{ 141438144912Sdeepblu2718 PetscInt d, e; 141538144912Sdeepblu2718 141638144912Sdeepblu2718 for (d = 0; d < 8; ++d) { 14179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ",%g", eventInfo->dof[d])); 141838144912Sdeepblu2718 } 141938144912Sdeepblu2718 for (e = 0; e < 8; ++e) { 14209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer, ",%g", eventInfo->errors[e])); 142138144912Sdeepblu2718 } 142238144912Sdeepblu2718 } 14239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIISynchronizedPrintf(viewer,"\n")); 142438144912Sdeepblu2718 } 142538144912Sdeepblu2718 } 14269566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 14279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPopSynchronized(viewer)); 142838144912Sdeepblu2718 PetscFunctionReturn(0); 142938144912Sdeepblu2718 } 143038144912Sdeepblu2718 1431217044c2SLisandro Dalcin static PetscErrorCode PetscLogViewWarnSync(MPI_Comm comm,FILE *fd) 1432217044c2SLisandro Dalcin { 1433217044c2SLisandro Dalcin PetscFunctionBegin; 1434217044c2SLisandro Dalcin if (!PetscLogSyncOn) PetscFunctionReturn(0); 14359566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n\n")); 14369566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n")); 14379566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14389566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # WARNING!!! #\n")); 14399566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14409566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # This program was run with logging synchronization. 
#\n")); 14419566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # This option provides more meaningful imbalance #\n")); 14429566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # figures at the expense of slowing things down and #\n")); 14439566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # providing a distorted view of the overall runtime. #\n")); 14449566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14459566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n\n\n")); 1446217044c2SLisandro Dalcin PetscFunctionReturn(0); 1447217044c2SLisandro Dalcin } 1448217044c2SLisandro Dalcin 1449f4091ad2SBarry Smith static PetscErrorCode PetscLogViewWarnDebugging(MPI_Comm comm,FILE *fd) 1450f4091ad2SBarry Smith { 1451f4091ad2SBarry Smith PetscFunctionBegin; 145276bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 14539566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n\n")); 14549566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n")); 14559566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14569566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # WARNING!!! #\n")); 14579566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14589566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # This code was compiled with a debugging option. #\n")); 14599566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # To get timing results run ./configure #\n")); 14609566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # using --with-debugging=no, the performance will #\n")); 14619566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # be generally two or three times faster. 
#\n")); 14629566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14639566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n\n\n")); 146476bd3646SJed Brown } 1465f4091ad2SBarry Smith PetscFunctionReturn(0); 1466f4091ad2SBarry Smith } 1467f4091ad2SBarry Smith 1468c2a741eeSJunchao Zhang static PetscErrorCode PetscLogViewWarnNoGpuAwareMpi(MPI_Comm comm,FILE *fd) 1469c2a741eeSJunchao Zhang { 1470009ab46cSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 1471009ab46cSJunchao Zhang PetscMPIInt size; 1472c2a741eeSJunchao Zhang 1473c2a741eeSJunchao Zhang PetscFunctionBegin; 14749566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 1475340fe3cdSSatish Balay if (use_gpu_aware_mpi || size == 1) PetscFunctionReturn(0); 14769566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n\n")); 14779566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n")); 14789566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14799566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # WARNING!!! #\n")); 14809566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14819566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # This code was compiled with GPU support and you've #\n")); 14829566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # created PETSc/GPU objects, but you intentionally #\n")); 14839566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # used -use_gpu_aware_mpi 0, requiring PETSc to copy #\n")); 14849566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # additional data between the GPU and CPU. 
To obtain #\n")); 14859566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # meaningful timing results on multi-rank runs, use #\n")); 14869566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # GPU-aware MPI instead. #\n")); 14879566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " # #\n")); 14889566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n\n\n")); 1489c2a741eeSJunchao Zhang PetscFunctionReturn(0); 1490c2a741eeSJunchao Zhang #else 1491c2a741eeSJunchao Zhang return 0; 1492c2a741eeSJunchao Zhang #endif 1493c2a741eeSJunchao Zhang } 1494c2a741eeSJunchao Zhang 1495156b51fbSBarry Smith static PetscErrorCode PetscLogViewWarnGpuTime(MPI_Comm comm,FILE *fd) 1496156b51fbSBarry Smith { 1497156b51fbSBarry Smith #if defined(PETSC_HAVE_DEVICE) 1498156b51fbSBarry Smith 1499156b51fbSBarry Smith PetscFunctionBegin; 1500156b51fbSBarry Smith if (!PetscLogGpuTimeFlag || petsc_gflops == 0) PetscFunctionReturn(0); 1501156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, "\n\n")); 1502156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n")); 1503156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # #\n")); 1504156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # WARNING!!! #\n")); 1505156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # #\n")); 1506156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # This code was run with -log_view_gpu_time #\n")); 1507156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # This provides accurate timing within the GPU kernels #\n")); 1508156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # but can slow down the entire computation by a #\n")); 1509156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # measurable amount. For fastest runs we recommend #\n")); 1510156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # not using this option. 
#\n")); 1511156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " # #\n")); 1512156b51fbSBarry Smith PetscCall(PetscFPrintf(comm, fd, " ##########################################################\n\n\n")); 1513156b51fbSBarry Smith PetscFunctionReturn(0); 1514156b51fbSBarry Smith #else 1515156b51fbSBarry Smith return 0; 1516156b51fbSBarry Smith #endif 1517156b51fbSBarry Smith } 1518156b51fbSBarry Smith 1519f14045dbSBarry Smith PetscErrorCode PetscLogView_Default(PetscViewer viewer) 15205c6c1daeSBarry Smith { 15215c6c1daeSBarry Smith FILE *fd; 15225c6c1daeSBarry Smith PetscLogDouble zero = 0.0; 15235c6c1daeSBarry Smith PetscStageLog stageLog; 15240298fd71SBarry Smith PetscStageInfo *stageInfo = NULL; 15250298fd71SBarry Smith PetscEventPerfInfo *eventInfo = NULL; 15265c6c1daeSBarry Smith PetscClassPerfInfo *classInfo; 15275c6c1daeSBarry Smith char arch[128],hostname[128],username[128],pname[PETSC_MAX_PATH_LEN],date[128]; 15285c6c1daeSBarry Smith const char *name; 15295c6c1daeSBarry Smith PetscLogDouble locTotalTime, TotalTime, TotalFlops; 15305c6c1daeSBarry Smith PetscLogDouble numMessages, messageLength, avgMessLen, numReductions; 15315c6c1daeSBarry Smith PetscLogDouble stageTime, flops, flopr, mem, mess, messLen, red; 15325c6c1daeSBarry Smith PetscLogDouble fracTime, fracFlops, fracMessages, fracLength, fracReductions, fracMess, fracMessLen, fracRed; 15335c6c1daeSBarry Smith PetscLogDouble fracStageTime, fracStageFlops, fracStageMess, fracStageMessLen, fracStageRed; 15345c6c1daeSBarry Smith PetscLogDouble min, max, tot, ratio, avg, x, y; 1535e3ed9ee7SBarry Smith PetscLogDouble minf, maxf, totf, ratf, mint, maxt, tott, ratt, ratC, totm, totml, totr, mal, malmax, emalmax; 1536d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 1537156b51fbSBarry Smith PetscLogEvent KSP_Solve, SNES_Solve, TS_Step, TAO_Solve; /* These need to be fixed to be some events registered with certain objects */ 1538958c4211Shannah_mairs PetscLogDouble cct, gct, csz, gsz, gmaxt, gflops, 
gflopr, fracgflops; 1539bec0b493Shannah_mairs #endif 1540217044c2SLisandro Dalcin PetscMPIInt minC, maxC; 15415c6c1daeSBarry Smith PetscMPIInt size, rank; 15425c6c1daeSBarry Smith PetscBool *localStageUsed, *stageUsed; 15435c6c1daeSBarry Smith PetscBool *localStageVisible, *stageVisible; 15445c6c1daeSBarry Smith int numStages, localNumEvents, numEvents; 154537b78d16SBarry Smith int stage, oclass; 15465c6c1daeSBarry Smith PetscLogEvent event; 1547d0609cedSBarry Smith PetscErrorCode ierr = 0; 15485c6c1daeSBarry Smith char version[256]; 15495c6c1daeSBarry Smith MPI_Comm comm; 1550156b51fbSBarry Smith #if defined(PETSC_HAVE_DEVICE) 1551156b51fbSBarry Smith PetscLogEvent eventid; 1552156b51fbSBarry Smith PetscInt64 nas = 0x7FF0000000000002; 1553156b51fbSBarry Smith #endif 15545c6c1daeSBarry Smith 15555c6c1daeSBarry Smith PetscFunctionBegin; 1556156b51fbSBarry Smith PetscCall(PetscFPTrapPush(PETSC_FP_TRAP_OFF)); 15579566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)viewer,&comm)); 15589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIGetPointer(viewer,&fd)); 15599566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 15609566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &rank)); 15615c6c1daeSBarry Smith /* Get the total elapsed time */ 15628563dfccSBarry Smith PetscTime(&locTotalTime); locTotalTime -= petsc_BaseTime; 15635c6c1daeSBarry Smith 1564faad7b01SPierre Jolivet PetscCall(PetscFPrintf(comm, fd, "****************************************************************************************************************************************************************\n")); 15659566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "*** WIDEN YOUR WINDOW TO 160 CHARACTERS. 
Use 'enscript -r -fCourier9' to print this document ***\n")); 15669566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "****************************************************************************************************************************************************************\n")); 1567faad7b01SPierre Jolivet PetscCall(PetscFPrintf(comm, fd, "\n------------------------------------------------------------------ PETSc Performance Summary: ------------------------------------------------------------------\n\n")); 15689566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnSync(comm,fd)); 15699566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnDebugging(comm,fd)); 15709566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnNoGpuAwareMpi(comm,fd)); 1571156b51fbSBarry Smith PetscCall(PetscLogViewWarnGpuTime(comm,fd)); 15729566063dSJacob Faibussowitsch PetscCall(PetscGetArchType(arch,sizeof(arch))); 15739566063dSJacob Faibussowitsch PetscCall(PetscGetHostName(hostname,sizeof(hostname))); 15749566063dSJacob Faibussowitsch PetscCall(PetscGetUserName(username,sizeof(username))); 15759566063dSJacob Faibussowitsch PetscCall(PetscGetProgramName(pname,sizeof(pname))); 15769566063dSJacob Faibussowitsch PetscCall(PetscGetDate(date,sizeof(date))); 15779566063dSJacob Faibussowitsch PetscCall(PetscGetVersion(version,sizeof(version))); 15785c6c1daeSBarry Smith if (size == 1) { 15799566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm,fd,"%s on a %s named %s with %d processor, by %s %s\n", pname, arch, hostname, size, username, date)); 15805c6c1daeSBarry Smith } else { 15819566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm,fd,"%s on a %s named %s with %d processors, by %s %s\n", pname, arch, hostname, size, username, date)); 15825c6c1daeSBarry Smith } 1583f90b075cSBarry Smith #if defined(PETSC_HAVE_OPENMP) 15849566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm,fd,"Using %" PetscInt_FMT " OpenMP threads\n", PetscNumOMPThreads)); 1585f90b075cSBarry 
Smith #endif 15869566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Using %s\n", version)); 15875c6c1daeSBarry Smith 15885c6c1daeSBarry Smith /* Must preserve reduction count before we go on */ 15895c6c1daeSBarry Smith red = petsc_allreduce_ct + petsc_gather_ct + petsc_scatter_ct; 15905c6c1daeSBarry Smith 15915c6c1daeSBarry Smith /* Calculate summary information */ 15929566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n Max Max/Min Avg Total\n")); 15935c6c1daeSBarry Smith /* Time */ 15949566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&locTotalTime, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 15959566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&locTotalTime, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 15969566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&locTotalTime, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1597217044c2SLisandro Dalcin avg = tot/((PetscLogDouble) size); 1598217044c2SLisandro Dalcin if (min != 0.0) ratio = max/min; else ratio = 0.0; 15999566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Time (sec): %5.3e %7.3f %5.3e\n", max, ratio, avg)); 16005c6c1daeSBarry Smith TotalTime = tot; 16015c6c1daeSBarry Smith /* Objects */ 16025c6c1daeSBarry Smith avg = (PetscLogDouble) petsc_numObjects; 16039566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&avg, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 16049566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&avg, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 16059566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&avg, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1606217044c2SLisandro Dalcin avg = tot/((PetscLogDouble) size); 1607217044c2SLisandro Dalcin if (min != 0.0) ratio = max/min; else ratio = 0.0; 16089566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Objects: %5.3e %7.3f %5.3e\n", max, ratio, avg)); 16095c6c1daeSBarry Smith /* Flops */ 16109566063dSJacob Faibussowitsch 
PetscCallMPI(MPI_Allreduce(&petsc_TotalFlops, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 16119566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&petsc_TotalFlops, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 16129566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&petsc_TotalFlops, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1613217044c2SLisandro Dalcin avg = tot/((PetscLogDouble) size); 1614217044c2SLisandro Dalcin if (min != 0.0) ratio = max/min; else ratio = 0.0; 16159566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Flops: %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 16165c6c1daeSBarry Smith TotalFlops = tot; 16175c6c1daeSBarry Smith /* Flops/sec -- Must talk to Barry here */ 1618217044c2SLisandro Dalcin if (locTotalTime != 0.0) flops = petsc_TotalFlops/locTotalTime; else flops = 0.0; 16199566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&flops, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 16209566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&flops, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 16219566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&flops, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1622217044c2SLisandro Dalcin avg = tot/((PetscLogDouble) size); 1623217044c2SLisandro Dalcin if (min != 0.0) ratio = max/min; else ratio = 0.0; 16249566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Flops/sec: %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 16255c6c1daeSBarry Smith /* Memory */ 16269566063dSJacob Faibussowitsch PetscCall(PetscMallocGetMaximumUsage(&mem)); 16275c6c1daeSBarry Smith if (mem > 0.0) { 16289566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mem, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 16299566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mem, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 16309566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mem, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1631217044c2SLisandro Dalcin avg = 
tot/((PetscLogDouble) size); 1632217044c2SLisandro Dalcin if (min != 0.0) ratio = max/min; else ratio = 0.0; 16339566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Memory (bytes): %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 16345c6c1daeSBarry Smith } 16355c6c1daeSBarry Smith /* Messages */ 16365c6c1daeSBarry Smith mess = 0.5*(petsc_irecv_ct + petsc_isend_ct + petsc_recv_ct + petsc_send_ct); 16379566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mess, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 16389566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mess, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 16399566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mess, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1640217044c2SLisandro Dalcin avg = tot/((PetscLogDouble) size); 1641217044c2SLisandro Dalcin if (min != 0.0) ratio = max/min; else ratio = 0.0; 16429566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "MPI Msg Count: %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 16435c6c1daeSBarry Smith numMessages = tot; 16445c6c1daeSBarry Smith /* Message Lengths */ 16455c6c1daeSBarry Smith mess = 0.5*(petsc_irecv_len + petsc_isend_len + petsc_recv_len + petsc_send_len); 16469566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mess, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 16479566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mess, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 16489566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&mess, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1649217044c2SLisandro Dalcin if (numMessages != 0) avg = tot/numMessages; else avg = 0.0; 1650217044c2SLisandro Dalcin if (min != 0.0) ratio = max/min; else ratio = 0.0; 16519566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "MPI Msg Len (bytes): %5.3e %7.3f %5.3e %5.3e\n", max, ratio, avg, tot)); 16525c6c1daeSBarry Smith messageLength = tot; 16535c6c1daeSBarry Smith /* Reductions */ 16549566063dSJacob 
Faibussowitsch PetscCallMPI(MPI_Allreduce(&red, &min, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 16559566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&red, &max, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 16569566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&red, &tot, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1657217044c2SLisandro Dalcin if (min != 0.0) ratio = max/min; else ratio = 0.0; 16589566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "MPI Reductions: %5.3e %7.3f\n", max, ratio)); 16595c6c1daeSBarry Smith numReductions = red; /* wrong because uses count from process zero */ 16609566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\nFlop counting convention: 1 flop = 1 real number operation of type (multiply/divide/add/subtract)\n")); 16619566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " e.g., VecAXPY() for real vectors of length N --> 2N flops\n")); 16629566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " and VecAXPY() for complex vectors of length N --> 8N flops\n")); 16635c6c1daeSBarry Smith 16645c6c1daeSBarry Smith /* Get total number of stages -- 16655c6c1daeSBarry Smith Currently, a single processor can register more stages than another, but stages must all be registered in order. 16665c6c1daeSBarry Smith We can removed this requirement if necessary by having a global stage numbering and indirection on the stage ID. 16675c6c1daeSBarry Smith This seems best accomplished by assoicating a communicator with each stage. 
16685c6c1daeSBarry Smith */ 16699566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 16709566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageLog->numStages, &numStages, 1, MPI_INT, MPI_MAX, comm)); 16719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numStages, &localStageUsed)); 16729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numStages, &stageUsed)); 16739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numStages, &localStageVisible)); 16749566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numStages, &stageVisible)); 16755c6c1daeSBarry Smith if (numStages > 0) { 16765c6c1daeSBarry Smith stageInfo = stageLog->stageInfo; 16775c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 16785c6c1daeSBarry Smith if (stage < stageLog->numStages) { 16795c6c1daeSBarry Smith localStageUsed[stage] = stageInfo[stage].used; 16805c6c1daeSBarry Smith localStageVisible[stage] = stageInfo[stage].perfInfo.visible; 16815c6c1daeSBarry Smith } else { 16825c6c1daeSBarry Smith localStageUsed[stage] = PETSC_FALSE; 16835c6c1daeSBarry Smith localStageVisible[stage] = PETSC_TRUE; 16845c6c1daeSBarry Smith } 16855c6c1daeSBarry Smith } 16869566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(localStageUsed, stageUsed, numStages, MPIU_BOOL, MPI_LOR, comm)); 16879566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(localStageVisible, stageVisible, numStages, MPIU_BOOL, MPI_LAND, comm)); 16885c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 16895c6c1daeSBarry Smith if (stageUsed[stage]) { 16909566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\nSummary of Stages: ----- Time ------ ----- Flop ------ --- Messages --- -- Message Lengths -- -- Reductions --\n")); 16919566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Avg %%Total Avg %%Total Count %%Total Avg %%Total Count %%Total\n")); 16925c6c1daeSBarry Smith break; 16935c6c1daeSBarry Smith } 16945c6c1daeSBarry Smith } 16955c6c1daeSBarry Smith 
for (stage = 0; stage < numStages; stage++) { 16965c6c1daeSBarry Smith if (!stageUsed[stage]) continue; 1697820f2d46SBarry Smith /* CANNOT use MPI_Allreduce() since it might fail the line number check */ 16985c6c1daeSBarry Smith if (localStageUsed[stage]) { 16999566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.time, &stageTime, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17009566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.flops, &flops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17019566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.numMessages, &mess, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17029566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.messageLength, &messLen, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17039566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.numReductions, &red, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17045c6c1daeSBarry Smith name = stageInfo[stage].name; 17055c6c1daeSBarry Smith } else { 17069566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &stageTime, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17079566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &flops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17089566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &mess, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17099566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &messLen, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17109566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &red, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 17115c6c1daeSBarry Smith name = ""; 17125c6c1daeSBarry Smith } 17135c6c1daeSBarry Smith mess *= 0.5; messLen *= 0.5; red /= size; 17145c6c1daeSBarry Smith if (TotalTime != 0.0) fracTime = stageTime/TotalTime; else fracTime = 0.0; 17155c6c1daeSBarry Smith if (TotalFlops != 0.0) fracFlops = flops/TotalFlops; else 
fracFlops = 0.0; 17165c6c1daeSBarry Smith /* Talk to Barry if (stageTime != 0.0) flops = (size*flops)/stageTime; else flops = 0.0; */ 17175c6c1daeSBarry Smith if (numMessages != 0.0) fracMessages = mess/numMessages; else fracMessages = 0.0; 1718e96a4d02SJunchao Zhang if (mess != 0.0) avgMessLen = messLen/mess; else avgMessLen = 0.0; 17195c6c1daeSBarry Smith if (messageLength != 0.0) fracLength = messLen/messageLength; else fracLength = 0.0; 17205c6c1daeSBarry Smith if (numReductions != 0.0) fracReductions = red/numReductions; else fracReductions = 0.0; 1721d0609cedSBarry Smith PetscCall(PetscFPrintf(comm, fd, "%2d: %15s: %6.4e %5.1f%% %6.4e %5.1f%% %5.3e %5.1f%% %5.3e %5.1f%% %5.3e %5.1f%%\n", 17225c6c1daeSBarry Smith stage, name, stageTime/size, 100.0*fracTime, flops, 100.0*fracFlops, 1723d0609cedSBarry Smith mess, 100.0*fracMessages, avgMessLen, 100.0*fracLength, red, 100.0*fracReductions)); 17245c6c1daeSBarry Smith } 17255c6c1daeSBarry Smith } 17265c6c1daeSBarry Smith 17279566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"\n------------------------------------------------------------------------------------------------------------------------\n")); 17289566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "See the 'Profiling' chapter of the users' manual for details on interpreting output.\n")); 17299566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Phase summary info:\n")); 17309566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Count: number of times phase was executed\n")); 17319566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Time and Flop: Max - maximum over all processors\n")); 17329566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Ratio - ratio of maximum to minimum over all processors\n")); 17339566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Mess: number of messages sent\n")); 17349566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " AvgLen: average 
message length (bytes)\n")); 17359566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Reduct: number of global reductions\n")); 17369566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Global: entire computation\n")); 17379566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Stage: stages of a computation. Set stages with PetscLogStagePush() and PetscLogStagePop().\n")); 17389566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " %%T - percent time in this phase %%F - percent flop in this phase\n")); 17399566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " %%M - percent messages in this phase %%L - percent message lengths in this phase\n")); 17409566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " %%R - percent reductions in this phase\n")); 17419566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " Total Mflop/s: 10e-6 * (sum of flop over all processors)/(max time over all processors)\n")); 1742e3ed9ee7SBarry Smith if (PetscLogMemory) { 174354aabf2dSBarry Smith PetscCall(PetscFPrintf(comm, fd, " Malloc Mbytes: Memory allocated and kept during event (sum over all calls to event). May be negative\n")); 174454aabf2dSBarry Smith PetscCall(PetscFPrintf(comm, fd, " EMalloc Mbytes: extra memory allocated during event and then freed (maximum over all calls to events). Never negative\n")); 174554aabf2dSBarry Smith PetscCall(PetscFPrintf(comm, fd, " MMalloc Mbytes: Increase in high water mark of allocated memory (sum over all calls to event). 
Never negative\n")); 17469566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " RMI Mbytes: Increase in resident memory (sum over all calls to event)\n")); 1747e3ed9ee7SBarry Smith } 1748d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 17499566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GPU Mflop/s: 10e-6 * (sum of flop on GPU over all processors)/(max GPU time over all processors)\n")); 17509566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " CpuToGpu Count: total number of CPU to GPU copies per processor\n")); 17519566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " CpuToGpu Size (Mbytes): 10e-6 * (total size of CPU to GPU copies per processor)\n")); 17529566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GpuToCpu Count: total number of GPU to CPU copies per processor\n")); 17539566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GpuToCpu Size (Mbytes): 10e-6 * (total size of GPU to CPU copies per processor)\n")); 17549566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, " GPU %%F: percent flops on GPU in this event\n")); 1755bec0b493Shannah_mairs #endif 17569566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "------------------------------------------------------------------------------------------------------------------------\n")); 17575c6c1daeSBarry Smith 17589566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnDebugging(comm,fd)); 17595c6c1daeSBarry Smith 17605c6c1daeSBarry Smith /* Report events */ 17619566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"Event Count Time (sec) Flop --- Global --- --- Stage ---- Total")); 1762e3ed9ee7SBarry Smith if (PetscLogMemory) { 17639566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd," Malloc EMalloc MMalloc RMI")); 1764e3ed9ee7SBarry Smith } 1765d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 17669566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd," GPU - CpuToGpu - - GpuToCpu - 
GPU")); 1767bec0b493Shannah_mairs #endif 17689566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"\n")); 17699566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd," Max Ratio Max Ratio Max Ratio Mess AvgLen Reduct %%T %%F %%M %%L %%R %%T %%F %%M %%L %%R Mflop/s")); 1770e3ed9ee7SBarry Smith if (PetscLogMemory) { 17719566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd," Mbytes Mbytes Mbytes Mbytes")); 1772e3ed9ee7SBarry Smith } 1773d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 17749566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd," Mflop/s Count Size Count Size %%F")); 1775bec0b493Shannah_mairs #endif 17769566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"\n")); 17779566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"------------------------------------------------------------------------------------------------------------------------")); 17784863603aSSatish Balay if (PetscLogMemory) { 17799566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"-----------------------------")); 17804863603aSSatish Balay } 1781d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 17829566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"---------------------------------------")); 17834863603aSSatish Balay #endif 17849566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"\n")); 17855c6c1daeSBarry Smith 1786156b51fbSBarry Smith #if defined(PETSC_HAVE_DEVICE) 1787156b51fbSBarry Smith /* this indirect way of accessing these values is needed when PETSc is build with multiple libraries since the symbols are not in libpetscsys */ 1788156b51fbSBarry Smith PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, "TAOSolve", &TAO_Solve)); 1789156b51fbSBarry Smith PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, "TSStep", &TS_Step)); 1790156b51fbSBarry Smith PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, "SNESSolve", &SNES_Solve)); 1791156b51fbSBarry Smith 
PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, "KSPSolve", &KSP_Solve)); 1792156b51fbSBarry Smith #endif 1793156b51fbSBarry Smith 17945c6c1daeSBarry Smith /* Problem: The stage name will not show up unless the stage executed on proc 1 */ 17955c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 17965c6c1daeSBarry Smith if (!stageVisible[stage]) continue; 1797820f2d46SBarry Smith /* CANNOT use MPI_Allreduce() since it might fail the line number check */ 17985c6c1daeSBarry Smith if (localStageUsed[stage]) { 17999566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n--- Event Stage %d: %s\n\n", stage, stageInfo[stage].name)); 18009566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.time, &stageTime, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18019566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.flops, &flops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18029566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.numMessages, &mess, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18039566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.messageLength, &messLen, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18049566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&stageInfo[stage].perfInfo.numReductions, &red, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18055c6c1daeSBarry Smith } else { 18069566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n--- Event Stage %d: Unknown\n\n", stage)); 18079566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &stageTime, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18089566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &flops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18099566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &mess, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18109566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &messLen, 1, 
MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18119566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &red, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18125c6c1daeSBarry Smith } 18135c6c1daeSBarry Smith mess *= 0.5; messLen *= 0.5; red /= size; 18145c6c1daeSBarry Smith 18155c6c1daeSBarry Smith /* Get total number of events in this stage -- 18165c6c1daeSBarry Smith Currently, a single processor can register more events than another, but events must all be registered in order, 18175c6c1daeSBarry Smith just like stages. We can removed this requirement if necessary by having a global event numbering and indirection 1818217044c2SLisandro Dalcin on the event ID. This seems best accomplished by associating a communicator with each stage. 18195c6c1daeSBarry Smith 18205c6c1daeSBarry Smith Problem: If the event did not happen on proc 1, its name will not be available. 18215c6c1daeSBarry Smith Problem: Event visibility is not implemented 18225c6c1daeSBarry Smith */ 18235c6c1daeSBarry Smith if (localStageUsed[stage]) { 18245c6c1daeSBarry Smith eventInfo = stageLog->stageInfo[stage].eventLog->eventInfo; 18255c6c1daeSBarry Smith localNumEvents = stageLog->stageInfo[stage].eventLog->numEvents; 1826a297a907SKarl Rupp } else localNumEvents = 0; 18279566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&localNumEvents, &numEvents, 1, MPI_INT, MPI_MAX, comm)); 18285c6c1daeSBarry Smith for (event = 0; event < numEvents; event++) { 1829820f2d46SBarry Smith /* CANNOT use MPI_Allreduce() since it might fail the line number check */ 18305c6c1daeSBarry Smith if (localStageUsed[stage] && (event < stageLog->stageInfo[stage].eventLog->numEvents) && (eventInfo[event].depth == 0)) { 1831217044c2SLisandro Dalcin if ((eventInfo[event].count > 0) && (eventInfo[event].time > 0.0)) flopr = eventInfo[event].flops; else flopr = 0.0; 18329566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&flopr, &minf, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 18339566063dSJacob Faibussowitsch 
PetscCallMPI(MPI_Allreduce(&flopr, &maxf, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 18349566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].flops, &totf, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18359566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].time, &mint, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 18369566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].time, &maxt, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 18379566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].time, &tott, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18389566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].numMessages, &totm, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18399566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].messageLength, &totml, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18409566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].numReductions, &totr, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18419566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].count, &minC, 1, MPI_INT, MPI_MIN, comm)); 18429566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].count, &maxC, 1, MPI_INT, MPI_MAX, comm)); 1843e3ed9ee7SBarry Smith if (PetscLogMemory) { 18449566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].memIncrease, &mem, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18459566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].mallocSpace, &mal, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18469566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].mallocIncrease, &malmax,1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18479566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].mallocIncreaseEvent, &emalmax,1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1848e3ed9ee7SBarry Smith } 1849d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 
18509566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].CpuToGpuCount, &cct, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18519566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].GpuToCpuCount, &gct, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18529566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].CpuToGpuSize, &csz, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18539566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].GpuToCpuSize, &gsz, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18549566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].GpuFlops, &gflops,1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18559566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&eventInfo[event].GpuTime, &gmaxt ,1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1856bec0b493Shannah_mairs #endif 18575c6c1daeSBarry Smith name = stageLog->eventLog->eventInfo[event].name; 18585c6c1daeSBarry Smith } else { 18595c6c1daeSBarry Smith flopr = 0.0; 18609566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&flopr, &minf, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 18619566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&flopr, &maxf, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 18629566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &totf, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18639566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &mint, 1, MPIU_PETSCLOGDOUBLE, MPI_MIN, comm)); 18649566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &maxt, 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 18659566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &tott, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18669566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &totm, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18679566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &totml, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18689566063dSJacob Faibussowitsch 
PetscCallMPI(MPI_Allreduce(&zero, &totr, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18699566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&ierr, &minC, 1, MPI_INT, MPI_MIN, comm)); 18709566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&ierr, &maxC, 1, MPI_INT, MPI_MAX, comm)); 1871e3ed9ee7SBarry Smith if (PetscLogMemory) { 18729566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &mem, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18739566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &mal, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18749566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &malmax, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18759566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &emalmax,1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 1876e3ed9ee7SBarry Smith } 1877d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 18789566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &cct, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18799566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &gct, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18809566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &csz, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18819566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &gsz, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18829566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &gflops, 1, MPIU_PETSCLOGDOUBLE, MPI_SUM, comm)); 18839566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allreduce(&zero, &gmaxt , 1, MPIU_PETSCLOGDOUBLE, MPI_MAX, comm)); 1884bec0b493Shannah_mairs #endif 18855c6c1daeSBarry Smith name = ""; 18865c6c1daeSBarry Smith } 18875c6c1daeSBarry Smith if (mint < 0.0) { 1888d0609cedSBarry Smith PetscCall(PetscFPrintf(comm, fd, "WARNING!!! Minimum time %g over all processors for %s is negative! 
This happens\n on some machines whose times cannot handle too rapid calls.!\n artificially changing minimum to zero.\n",mint,name)); 18895c6c1daeSBarry Smith mint = 0; 18905c6c1daeSBarry Smith } 189108401ef6SPierre Jolivet PetscCheck(minf >= 0.0,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Minimum flop %g over all processors for %s is negative! Not possible!",minf,name); 1892156b51fbSBarry Smith /* Put NaN into the time for all events that may not be time accurately since they may happen asynchronously on the GPU */ 1893156b51fbSBarry Smith #if defined(PETSC_HAVE_DEVICE) 1894156b51fbSBarry Smith if (!PetscLogGpuTimeFlag && petsc_gflops > 0) { 1895156b51fbSBarry Smith memcpy(&gmaxt,&nas,sizeof(PetscLogDouble)); 1896156b51fbSBarry Smith PetscCall(PetscEventRegLogGetEvent(stageLog->eventLog, name, &eventid)); 1897156b51fbSBarry Smith if (eventid != SNES_Solve && eventid != KSP_Solve && eventid != TS_Step && eventid != TAO_Solve) { 1898156b51fbSBarry Smith memcpy(&mint,&nas,sizeof(PetscLogDouble)); 1899156b51fbSBarry Smith memcpy(&maxt,&nas,sizeof(PetscLogDouble)); 1900156b51fbSBarry Smith } 1901156b51fbSBarry Smith } 1902156b51fbSBarry Smith #endif 19035c6c1daeSBarry Smith totm *= 0.5; totml *= 0.5; totr /= size; 19045c6c1daeSBarry Smith 1905217044c2SLisandro Dalcin if (maxC != 0) { 1906217044c2SLisandro Dalcin if (minC != 0) ratC = ((PetscLogDouble)maxC)/minC;else ratC = 0.0; 19075c6c1daeSBarry Smith if (mint != 0.0) ratt = maxt/mint; else ratt = 0.0; 19085c6c1daeSBarry Smith if (minf != 0.0) ratf = maxf/minf; else ratf = 0.0; 19095c6c1daeSBarry Smith if (TotalTime != 0.0) fracTime = tott/TotalTime; else fracTime = 0.0; 19105c6c1daeSBarry Smith if (TotalFlops != 0.0) fracFlops = totf/TotalFlops; else fracFlops = 0.0; 19115c6c1daeSBarry Smith if (stageTime != 0.0) fracStageTime = tott/stageTime; else fracStageTime = 0.0; 19125c6c1daeSBarry Smith if (flops != 0.0) fracStageFlops = totf/flops; else fracStageFlops = 0.0; 19135c6c1daeSBarry Smith if (numMessages != 0.0) fracMess = 
totm/numMessages; else fracMess = 0.0; 19145c6c1daeSBarry Smith if (messageLength != 0.0) fracMessLen = totml/messageLength; else fracMessLen = 0.0; 19155c6c1daeSBarry Smith if (numReductions != 0.0) fracRed = totr/numReductions; else fracRed = 0.0; 19165c6c1daeSBarry Smith if (mess != 0.0) fracStageMess = totm/mess; else fracStageMess = 0.0; 19175c6c1daeSBarry Smith if (messLen != 0.0) fracStageMessLen = totml/messLen; else fracStageMessLen = 0.0; 19185c6c1daeSBarry Smith if (red != 0.0) fracStageRed = totr/red; else fracStageRed = 0.0; 19195c6c1daeSBarry Smith if (totm != 0.0) totml /= totm; else totml = 0.0; 19205c6c1daeSBarry Smith if (maxt != 0.0) flopr = totf/maxt; else flopr = 0.0; 19219566063dSJacob Faibussowitsch if (fracStageTime > 1.00) PetscCall(PetscFPrintf(comm, fd,"Warning -- total time of event greater than time of entire stage -- something is wrong with the timer\n")); 1922d0609cedSBarry Smith PetscCall(PetscFPrintf(comm, fd, 1923e3ed9ee7SBarry Smith "%-16s %7d%4.1f %5.4e%4.1f %3.2e%4.1f %2.1e %2.1e %2.1e%3.0f%3.0f%3.0f%3.0f%3.0f %3.0f%3.0f%3.0f%3.0f%3.0f %5.0f", 1924217044c2SLisandro Dalcin name, maxC, ratC, maxt, ratt, maxf, ratf, totm, totml, totr, 19255c6c1daeSBarry Smith 100.0*fracTime, 100.0*fracFlops, 100.0*fracMess, 100.0*fracMessLen, 100.0*fracRed, 19265c6c1daeSBarry Smith 100.0*fracStageTime, 100.0*fracStageFlops, 100.0*fracStageMess, 100.0*fracStageMessLen, 100.0*fracStageRed, 1927d0609cedSBarry Smith PetscAbs(flopr)/1.0e6)); 1928e3ed9ee7SBarry Smith if (PetscLogMemory) { 19299566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd," %5.0f %5.0f %5.0f %5.0f",mal/1.0e6,emalmax/1.0e6,malmax/1.0e6,mem/1.0e6)); 1930e3ed9ee7SBarry Smith } 1931d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 1932958c4211Shannah_mairs if (totf != 0.0) fracgflops = gflops/totf; else fracgflops = 0.0; 1933958c4211Shannah_mairs if (gmaxt != 0.0) gflopr = gflops/gmaxt; else gflopr = 0.0; 19349566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd," 
%5.0f %4.0f %3.2e %4.0f %3.2e% 3.0f",PetscAbs(gflopr)/1.0e6,cct/size,csz/(1.0e6*size),gct/size,gsz/(1.0e6*size),100.0*fracgflops)); 1935bec0b493Shannah_mairs #endif 19369566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd,"\n")); 19375c6c1daeSBarry Smith } 19385c6c1daeSBarry Smith } 19395c6c1daeSBarry Smith } 19405c6c1daeSBarry Smith 19415c6c1daeSBarry Smith /* Memory usage and object creation */ 19429566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "------------------------------------------------------------------------------------------------------------------------")); 19434863603aSSatish Balay if (PetscLogMemory) { 19449566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "-----------------------------")); 19454863603aSSatish Balay } 1946d9c66bfbSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 19479566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "---------------------------------------")); 19484863603aSSatish Balay #endif 19499566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 19509566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 19515c6c1daeSBarry Smith 19525c6c1daeSBarry Smith /* Right now, only stages on the first processor are reported here, meaning only objects associated with 19535c6c1daeSBarry Smith the global communicator, or MPI_COMM_SELF for proc 1. We really should report global stats and then 19545c6c1daeSBarry Smith stats for stages local to processor sets. 19555c6c1daeSBarry Smith */ 19565c6c1daeSBarry Smith /* We should figure out the longest object name here (now 20 characters) */ 19574851f57dSBarry Smith PetscCall(PetscFPrintf(comm, fd, "Object Type Creations Destructions. 
Reports information only for process 0.\n")); 19585c6c1daeSBarry Smith for (stage = 0; stage < numStages; stage++) { 19595c6c1daeSBarry Smith if (localStageUsed[stage]) { 19605c6c1daeSBarry Smith classInfo = stageLog->stageInfo[stage].classLog->classInfo; 19619566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n--- Event Stage %d: %s\n\n", stage, stageInfo[stage].name)); 19625c6c1daeSBarry Smith for (oclass = 0; oclass < stageLog->stageInfo[stage].classLog->numClasses; oclass++) { 19635c6c1daeSBarry Smith if ((classInfo[oclass].creations > 0) || (classInfo[oclass].destructions > 0)) { 19644851f57dSBarry Smith PetscCall(PetscFPrintf(comm, fd, "%20s %5d %5d\n", stageLog->classLog->classInfo[oclass].name,classInfo[oclass].creations, classInfo[oclass].destructions)); 19655c6c1daeSBarry Smith } 19665c6c1daeSBarry Smith } 19675c6c1daeSBarry Smith } else { 1968cf019ec6SStefano Zampini if (!localStageVisible[stage]) continue; 19699566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n--- Event Stage %d: Unknown\n\n", stage)); 19705c6c1daeSBarry Smith } 19715c6c1daeSBarry Smith } 19725c6c1daeSBarry Smith 19739566063dSJacob Faibussowitsch PetscCall(PetscFree(localStageUsed)); 19749566063dSJacob Faibussowitsch PetscCall(PetscFree(stageUsed)); 19759566063dSJacob Faibussowitsch PetscCall(PetscFree(localStageVisible)); 19769566063dSJacob Faibussowitsch PetscCall(PetscFree(stageVisible)); 19775c6c1daeSBarry Smith 19785c6c1daeSBarry Smith /* Information unrelated to this particular run */ 19799566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "========================================================================================================================\n")); 19808563dfccSBarry Smith PetscTime(&y); 19818563dfccSBarry Smith PetscTime(&x); 19828563dfccSBarry Smith PetscTime(&y); PetscTime(&y); PetscTime(&y); PetscTime(&y); PetscTime(&y); 19838563dfccSBarry Smith PetscTime(&y); PetscTime(&y); PetscTime(&y); PetscTime(&y); PetscTime(&y); 
19849566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm,fd,"Average time to get PetscTime(): %g\n", (y-x)/10.0)); 19855c6c1daeSBarry Smith /* MPI information */ 19865c6c1daeSBarry Smith if (size > 1) { 19875c6c1daeSBarry Smith MPI_Status status; 19885c6c1daeSBarry Smith PetscMPIInt tag; 19895c6c1daeSBarry Smith MPI_Comm newcomm; 19905c6c1daeSBarry Smith 19919566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 19928563dfccSBarry Smith PetscTime(&x); 19939566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 19949566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 19959566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 19969566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 19979566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 19988563dfccSBarry Smith PetscTime(&y); 19999566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Average time for MPI_Barrier(): %g\n", (y-x)/5.0)); 20009566063dSJacob Faibussowitsch PetscCall(PetscCommDuplicate(comm,&newcomm, &tag)); 20019566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(comm)); 20025c6c1daeSBarry Smith if (rank) { 20039566063dSJacob Faibussowitsch PetscCallMPI(MPI_Recv(NULL, 0, MPI_INT, rank-1, tag, newcomm, &status)); 20049566063dSJacob Faibussowitsch PetscCallMPI(MPI_Send(NULL, 0, MPI_INT, (rank+1)%size, tag, newcomm)); 20055c6c1daeSBarry Smith } else { 20068563dfccSBarry Smith PetscTime(&x); 20079566063dSJacob Faibussowitsch PetscCallMPI(MPI_Send(NULL, 0, MPI_INT, 1, tag, newcomm)); 20089566063dSJacob Faibussowitsch PetscCallMPI(MPI_Recv(NULL, 0, MPI_INT, size-1, tag, newcomm, &status)); 20098563dfccSBarry Smith PetscTime(&y); 20109566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm,fd,"Average time for zero size MPI_Send(): %g\n", (y-x)/size)); 20115c6c1daeSBarry Smith } 20129566063dSJacob Faibussowitsch PetscCall(PetscCommDestroy(&newcomm)); 20135c6c1daeSBarry Smith } 20149566063dSJacob Faibussowitsch 
PetscCall(PetscOptionsView(NULL,viewer)); 20155c6c1daeSBarry Smith 20165c6c1daeSBarry Smith /* Machine and compile information */ 20175c6c1daeSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNELS) 20189566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with FORTRAN kernels\n")); 20195c6c1daeSBarry Smith #else 20209566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled without FORTRAN kernels\n")); 20215c6c1daeSBarry Smith #endif 2022217044c2SLisandro Dalcin #if defined(PETSC_USE_64BIT_INDICES) 20239566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with 64 bit PetscInt\n")); 2024217044c2SLisandro Dalcin #elif defined(PETSC_USE___FLOAT128) 20259566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with 32 bit PetscInt\n")); 2026217044c2SLisandro Dalcin #endif 20275c6c1daeSBarry Smith #if defined(PETSC_USE_REAL_SINGLE) 20289566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with single precision PetscScalar and PetscReal\n")); 20295f27b2e0SBarry Smith #elif defined(PETSC_USE___FLOAT128) 20309566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with 128 bit precision PetscScalar and PetscReal\n")); 20315c6c1daeSBarry Smith #endif 20325c6c1daeSBarry Smith #if defined(PETSC_USE_REAL_MAT_SINGLE) 20339566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with single precision matrices\n")); 20345c6c1daeSBarry Smith #else 20359566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Compiled with full precision matrices (default)\n")); 20365c6c1daeSBarry Smith #endif 2037d0609cedSBarry Smith PetscCall(PetscFPrintf(comm, fd, "sizeof(short) %d sizeof(int) %d sizeof(long) %d sizeof(void*) %d sizeof(PetscScalar) %d sizeof(PetscInt) %d\n", 2038d0609cedSBarry Smith (int) sizeof(short), (int) sizeof(int), (int) sizeof(long), (int) sizeof(void*),(int) sizeof(PetscScalar),(int) sizeof(PetscInt))); 20395c6c1daeSBarry Smith 20409566063dSJacob 
Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "Configure options: %s",petscconfigureoptions)); 20419566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s", petscmachineinfo)); 20429566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s", petsccompilerinfo)); 20439566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s", petsccompilerflagsinfo)); 20449566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "%s", petsclinkerinfo)); 20455c6c1daeSBarry Smith 20465c6c1daeSBarry Smith /* Cleanup */ 20479566063dSJacob Faibussowitsch PetscCall(PetscFPrintf(comm, fd, "\n")); 20489566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnNoGpuAwareMpi(comm,fd)); 20499566063dSJacob Faibussowitsch PetscCall(PetscLogViewWarnDebugging(comm,fd)); 2050156b51fbSBarry Smith PetscCall(PetscFPTrapPop()); 20515c6c1daeSBarry Smith PetscFunctionReturn(0); 20525c6c1daeSBarry Smith } 20535c6c1daeSBarry Smith 20547d6c928cSSatish Balay /*@C 20557d6c928cSSatish Balay PetscLogView - Prints a summary of the logging. 20565c6c1daeSBarry Smith 20575c6c1daeSBarry Smith Collective over MPI_Comm 20585c6c1daeSBarry Smith 20595c6c1daeSBarry Smith Input Parameter: 2060f14045dbSBarry Smith . viewer - an ASCII viewer 20615c6c1daeSBarry Smith 20625c6c1daeSBarry Smith Options Database Keys: 2063bb1d7374SBarry Smith + -log_view [:filename] - Prints summary of log information 2064bb1d7374SBarry Smith . -log_view :filename.py:ascii_info_detail - Saves logging information from each process as a Python file 2065607d249eSBarry Smith . -log_view :filename.xml:ascii_xml - Saves a summary of the logging information in a nested format (see below for how to view it) 2066d0a29bd7SConnor Ward . -log_view :filename.txt:ascii_flamegraph - Saves logging information in a format suitable for visualising as a Flame Graph (see below for how to view it) 2067156b51fbSBarry Smith . -log_view_memory - Also display memory usage in each event 2068156b51fbSBarry Smith . 
-log_view_gpu_time - Also display time in each event for GPU kernels (Note this may slow the computation)
.  -log_all - Saves a file Log.rank for each MPI process with details of each step of the computation
-  -log_trace [filename] - Displays a trace of what each process is doing

   Notes:
   It is possible to control the logging programmatically but we recommend using the options database approach whenever possible.
   By default the summary is printed to stdout.

   Before calling this routine you must have called either PetscLogDefaultBegin() or PetscLogNestedBegin()

   If PETSc is configured with --with-logging=0 then this functionality is not available

   To view the nested XML format filename.xml first copy ${PETSC_DIR}/share/petsc/xml/performance_xml2html.xsl to the current
   directory then open filename.xml with your browser. Specific notes for certain browsers
$    Firefox and Internet Explorer - simply open the file
$    Google Chrome - you must start up Chrome with the option --allow-file-access-from-files
$    Safari - see https://ccm.net/faq/36342-safari-how-to-enable-local-file-access
   or one can use the package http://xmlsoft.org/XSLT/xsltproc2.html to translate the xml file to html and then open it with
   your browser.
   Alternatively, use the script ${PETSC_DIR}/lib/petsc/bin/petsc-performance-view to automatically open a new browser
   window and render the XML log file contents.
2089607d249eSBarry Smith 2090bb1d7374SBarry Smith The nested XML format was kindly donated by Koos Huijssen and Christiaan M. Klaij MARITIME RESEARCH INSTITUTE NETHERLANDS 2091bb1d7374SBarry Smith 2092d0a29bd7SConnor Ward The Flame Graph output can be visualised using either the original Flame Graph script (https://github.com/brendangregg/FlameGraph) 2093d0a29bd7SConnor Ward or using speedscope (https://www.speedscope.app). 2094d0a29bd7SConnor Ward Old XML profiles may be converted into this format using the script ${PETSC_DIR}/lib/petsc/bin/xml2flamegraph.py. 2095d0a29bd7SConnor Ward 20965c6c1daeSBarry Smith Level: beginner 20975c6c1daeSBarry Smith 2098db781477SPatrick Sanan .seealso: `PetscLogDefaultBegin()`, `PetscLogDump()` 20995c6c1daeSBarry Smith @*/ 2100f14045dbSBarry Smith PetscErrorCode PetscLogView(PetscViewer viewer) 21015c6c1daeSBarry Smith { 2102f14045dbSBarry Smith PetscBool isascii; 2103f14045dbSBarry Smith PetscViewerFormat format; 210437b78d16SBarry Smith int stage, lastStage; 210537b78d16SBarry Smith PetscStageLog stageLog; 21065c6c1daeSBarry Smith 21075c6c1daeSBarry Smith PetscFunctionBegin; 210828b400f6SJacob Faibussowitsch PetscCheck(PetscLogPLB,PETSC_COMM_SELF,PETSC_ERR_SUP,"Must use -log_view or PetscLogDefaultBegin() before calling this routine"); 210937b78d16SBarry Smith /* Pop off any stages the user forgot to remove */ 211037b78d16SBarry Smith lastStage = 0; 21119566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 21129566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 211337b78d16SBarry Smith while (stage >= 0) { 211437b78d16SBarry Smith lastStage = stage; 21159566063dSJacob Faibussowitsch PetscCall(PetscStageLogPop(stageLog)); 21169566063dSJacob Faibussowitsch PetscCall(PetscStageLogGetCurrent(stageLog, &stage)); 211737b78d16SBarry Smith } 21189566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii)); 211928b400f6SJacob 
Faibussowitsch PetscCheck(isascii,PetscObjectComm((PetscObject)viewer),PETSC_ERR_SUP,"Currently can only view logging to ASCII"); 21209566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 2121f14045dbSBarry Smith if (format == PETSC_VIEWER_DEFAULT || format == PETSC_VIEWER_ASCII_INFO) { 21229566063dSJacob Faibussowitsch PetscCall(PetscLogView_Default(viewer)); 2123f14045dbSBarry Smith } else if (format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 21249566063dSJacob Faibussowitsch PetscCall(PetscLogView_Detailed(viewer)); 212538144912Sdeepblu2718 } else if (format == PETSC_VIEWER_ASCII_CSV) { 21269566063dSJacob Faibussowitsch PetscCall(PetscLogView_CSV(viewer)); 2127bb1d7374SBarry Smith } else if (format == PETSC_VIEWER_ASCII_XML) { 21289566063dSJacob Faibussowitsch PetscCall(PetscLogView_Nested(viewer)); 2129d0a29bd7SConnor Ward } else if (format == PETSC_VIEWER_ASCII_FLAMEGRAPH) { 21309566063dSJacob Faibussowitsch PetscCall(PetscLogView_Flamegraph(viewer)); 21315c6c1daeSBarry Smith } 21329566063dSJacob Faibussowitsch PetscCall(PetscStageLogPush(stageLog, lastStage)); 21335c6c1daeSBarry Smith PetscFunctionReturn(0); 21345c6c1daeSBarry Smith } 21355c6c1daeSBarry Smith 2136f14045dbSBarry Smith /*@C 2137f14045dbSBarry Smith PetscLogViewFromOptions - Processes command line options to determine if/how a PetscLog is to be viewed. 
2138f14045dbSBarry Smith 2139f14045dbSBarry Smith Collective on PETSC_COMM_WORLD 2140f14045dbSBarry Smith 2141f14045dbSBarry Smith Not normally called by user 2142f14045dbSBarry Smith 2143f14045dbSBarry Smith Level: intermediate 2144f14045dbSBarry Smith 2145f14045dbSBarry Smith @*/ 2146f14045dbSBarry Smith PetscErrorCode PetscLogViewFromOptions(void) 2147f14045dbSBarry Smith { 2148f14045dbSBarry Smith PetscViewer viewer; 2149f14045dbSBarry Smith PetscBool flg; 2150f14045dbSBarry Smith PetscViewerFormat format; 2151f14045dbSBarry Smith 2152f14045dbSBarry Smith PetscFunctionBegin; 21539566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetViewer(PETSC_COMM_WORLD,NULL,NULL,"-log_view",&viewer,&format,&flg)); 2154f14045dbSBarry Smith if (flg) { 21559566063dSJacob Faibussowitsch PetscCall(PetscViewerPushFormat(viewer,format)); 21569566063dSJacob Faibussowitsch PetscCall(PetscLogView(viewer)); 21579566063dSJacob Faibussowitsch PetscCall(PetscViewerPopFormat(viewer)); 21589566063dSJacob Faibussowitsch PetscCall(PetscViewerDestroy(&viewer)); 2159f14045dbSBarry Smith } 2160f14045dbSBarry Smith PetscFunctionReturn(0); 2161f14045dbSBarry Smith } 2162f14045dbSBarry Smith 21635c6c1daeSBarry Smith /*----------------------------------------------- Counter Functions -------------------------------------------------*/ 21645c6c1daeSBarry Smith /*@C 21655c6c1daeSBarry Smith PetscGetFlops - Returns the number of flops used on this processor 21665c6c1daeSBarry Smith since the program began. 21675c6c1daeSBarry Smith 21685c6c1daeSBarry Smith Not Collective 21695c6c1daeSBarry Smith 21705c6c1daeSBarry Smith Output Parameter: 21715c6c1daeSBarry Smith flops - number of floating point operations 21725c6c1daeSBarry Smith 21735c6c1daeSBarry Smith Notes: 21745c6c1daeSBarry Smith A global counter logs all PETSc flop counts. The user can use 21755c6c1daeSBarry Smith PetscLogFlops() to increment this counter to include flops for the 21765c6c1daeSBarry Smith application code. 
21775c6c1daeSBarry Smith 21785c6c1daeSBarry Smith Level: intermediate 21795c6c1daeSBarry Smith 2180db781477SPatrick Sanan .seealso: `PetscTime()`, `PetscLogFlops()` 21815c6c1daeSBarry Smith @*/ 21825c6c1daeSBarry Smith PetscErrorCode PetscGetFlops(PetscLogDouble *flops) 21835c6c1daeSBarry Smith { 21845c6c1daeSBarry Smith PetscFunctionBegin; 21855c6c1daeSBarry Smith *flops = petsc_TotalFlops; 21865c6c1daeSBarry Smith PetscFunctionReturn(0); 21875c6c1daeSBarry Smith } 21885c6c1daeSBarry Smith 21895c6c1daeSBarry Smith PetscErrorCode PetscLogObjectState(PetscObject obj, const char format[], ...) 21905c6c1daeSBarry Smith { 21915c6c1daeSBarry Smith size_t fullLength; 21925c6c1daeSBarry Smith va_list Argp; 21935c6c1daeSBarry Smith 21945c6c1daeSBarry Smith PetscFunctionBegin; 21955c6c1daeSBarry Smith if (!petsc_logObjects) PetscFunctionReturn(0); 21965c6c1daeSBarry Smith va_start(Argp, format); 21979566063dSJacob Faibussowitsch PetscCall(PetscVSNPrintf(petsc_objects[obj->id].info, 64,format,&fullLength, Argp)); 21985c6c1daeSBarry Smith va_end(Argp); 21995c6c1daeSBarry Smith PetscFunctionReturn(0); 22005c6c1daeSBarry Smith } 22015c6c1daeSBarry Smith 22025c6c1daeSBarry Smith /*MC 22035c6c1daeSBarry Smith PetscLogFlops - Adds floating point operations to the global counter. 22045c6c1daeSBarry Smith 22055c6c1daeSBarry Smith Synopsis: 2206aaa7dc30SBarry Smith #include <petsclog.h> 22075c6c1daeSBarry Smith PetscErrorCode PetscLogFlops(PetscLogDouble f) 22085c6c1daeSBarry Smith 22095c6c1daeSBarry Smith Not Collective 22105c6c1daeSBarry Smith 22115c6c1daeSBarry Smith Input Parameter: 22125c6c1daeSBarry Smith . 
f - flop counter 22135c6c1daeSBarry Smith 22145c6c1daeSBarry Smith Usage: 22155c6c1daeSBarry Smith .vb 22165c6c1daeSBarry Smith PetscLogEvent USER_EVENT; 22175c6c1daeSBarry Smith PetscLogEventRegister("User event",0,&USER_EVENT); 22185c6c1daeSBarry Smith PetscLogEventBegin(USER_EVENT,0,0,0,0); 22195c6c1daeSBarry Smith [code segment to monitor] 22205c6c1daeSBarry Smith PetscLogFlops(user_flops) 22215c6c1daeSBarry Smith PetscLogEventEnd(USER_EVENT,0,0,0,0); 22225c6c1daeSBarry Smith .ve 22235c6c1daeSBarry Smith 22245c6c1daeSBarry Smith Notes: 22255c6c1daeSBarry Smith A global counter logs all PETSc flop counts. The user can use 22265c6c1daeSBarry Smith PetscLogFlops() to increment this counter to include flops for the 22275c6c1daeSBarry Smith application code. 22285c6c1daeSBarry Smith 22295c6c1daeSBarry Smith Level: intermediate 22305c6c1daeSBarry Smith 2231db781477SPatrick Sanan .seealso: `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscGetFlops()` 22325c6c1daeSBarry Smith 22335c6c1daeSBarry Smith M*/ 22345c6c1daeSBarry Smith 22355c6c1daeSBarry Smith /*MC 22365c6c1daeSBarry Smith PetscPreLoadBegin - Begin a segment of code that may be preloaded (run twice) 22375c6c1daeSBarry Smith to get accurate timings 22385c6c1daeSBarry Smith 22395c6c1daeSBarry Smith Synopsis: 2240aaa7dc30SBarry Smith #include <petsclog.h> 22415c6c1daeSBarry Smith void PetscPreLoadBegin(PetscBool flag,char *name); 22425c6c1daeSBarry Smith 22435c6c1daeSBarry Smith Not Collective 22445c6c1daeSBarry Smith 2245d8d19677SJose E. 
Input Parameters:
+   flag - PETSC_TRUE to run twice, PETSC_FALSE to run once, may be overridden
           with command line option -preload true or -preload false
-   name - name of first stage (lines of code timed separately with -log_view) to
           be preloaded

   Usage:
.vb
      PetscPreLoadBegin(PETSC_TRUE,"first stage");
        lines of code
      PetscPreLoadStage("second stage");
        lines of code
      PetscPreLoadEnd();
.ve

   Notes:
    Only works in C/C++, not Fortran

     Flags available within the macro.
+    PetscPreLoadingUsed - true if we are or have done preloading
.    PetscPreLoadingOn - true if it is CURRENTLY doing preload
.
PetscPreLoadIt - 0 for the first computation (with preloading turned off it is only 0) 1 for the second
-    PetscPreLoadMax - number of times it will do the computation, only one when preloading is turned on
     The first two variables are available throughout the program, the second two only between the PetscPreLoadBegin()
     and PetscPreLoadEnd()

   Level: intermediate

.seealso: `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadEnd()`, `PetscPreLoadStage()`

M*/

/*MC
   PetscPreLoadEnd - End a segment of code that may be preloaded (run twice)
    to get accurate timings

   Synopsis:
   #include <petsclog.h>
   void PetscPreLoadEnd(void);

   Not Collective

   Usage:
.vb
      PetscPreLoadBegin(PETSC_TRUE,"first stage");
        lines of code
      PetscPreLoadStage("second stage");
        lines of code
      PetscPreLoadEnd();
.ve

   Notes:
    Only works in C/C++, not Fortran

   Level: intermediate

.seealso: `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadBegin()`, `PetscPreLoadStage()`

M*/

/*MC
23065c6c1daeSBarry Smith PetscPreLoadStage - Start a new segment of code to be timed separately. 23075c6c1daeSBarry Smith to get accurate timings 23085c6c1daeSBarry Smith 23095c6c1daeSBarry Smith Synopsis: 2310aaa7dc30SBarry Smith #include <petsclog.h> 23115c6c1daeSBarry Smith void PetscPreLoadStage(char *name); 23125c6c1daeSBarry Smith 23135c6c1daeSBarry Smith Not Collective 23145c6c1daeSBarry Smith 23155c6c1daeSBarry Smith Usage: 23165c6c1daeSBarry Smith .vb 23175c6c1daeSBarry Smith PetscPreLoadBegin(PETSC_TRUE,"first stage); 23185c6c1daeSBarry Smith lines of code 23195c6c1daeSBarry Smith PetscPreLoadStage("second stage"); 23205c6c1daeSBarry Smith lines of code 23215c6c1daeSBarry Smith PetscPreLoadEnd(); 23225c6c1daeSBarry Smith .ve 23235c6c1daeSBarry Smith 232495452b02SPatrick Sanan Notes: 232595452b02SPatrick Sanan only works in C/C++ not fortran 23265c6c1daeSBarry Smith 23275c6c1daeSBarry Smith Level: intermediate 23285c6c1daeSBarry Smith 2329db781477SPatrick Sanan .seealso: `PetscLogEventRegister()`, `PetscLogEventBegin()`, `PetscLogEventEnd()`, `PetscPreLoadBegin()`, `PetscPreLoadEnd()` 23305c6c1daeSBarry Smith 23315c6c1daeSBarry Smith M*/ 23325c6c1daeSBarry Smith 2333a4af0ceeSJacob Faibussowitsch #if PetscDefined(HAVE_DEVICE) 2334a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h> 23359ffd0706SHong Zhang 2336156b51fbSBarry Smith PetscBool PetscLogGpuTimeFlag = PETSC_FALSE; 2337156b51fbSBarry Smith 2338156b51fbSBarry Smith /* 2339156b51fbSBarry Smith This cannot be called by users between PetscInitialize() and PetscFinalize() at any random location in the code 2340156b51fbSBarry Smith because it will result in timing results that cannot be interpreted. 
2341156b51fbSBarry Smith */ 2342156b51fbSBarry Smith static PetscErrorCode PetscLogGpuTime_Off(void) 2343156b51fbSBarry Smith { 2344156b51fbSBarry Smith PetscLogGpuTimeFlag = PETSC_FALSE; 2345156b51fbSBarry Smith return 0; 2346156b51fbSBarry Smith } 2347156b51fbSBarry Smith 2348156b51fbSBarry Smith /*@C 2349156b51fbSBarry Smith PetscLogGpuTime - turn on the logging of GPU time for GPU kernels 2350156b51fbSBarry Smith 2351156b51fbSBarry Smith Options Database: 2352156b51fbSBarry Smith . -log_view_gpu_time - provide the GPU times in the -log_view output 2353156b51fbSBarry Smith 2354156b51fbSBarry Smith Notes: 2355156b51fbSBarry Smith Because the logging of GPU time requires blocking the CPU execution for each kernel, turning on the timing of the 2356156b51fbSBarry Smith GPU kernels can slow down the entire computation and should only be used when studying the performance 2357156b51fbSBarry Smith of operations on GPU such as vector operations and matrix-vector operations. 2358156b51fbSBarry Smith 2359156b51fbSBarry Smith This routine should only be called once near the beginning of the program. Once it is started it cannot be turned off. 
2360156b51fbSBarry Smith 23610f8f8846SPatrick Sanan Level: advanced 23620f8f8846SPatrick Sanan 2363db781477SPatrick Sanan .seealso: `PetscLogView()`, `PetscLogGpuFlops()`, `PetscLogGpuTimeEnd()`, `PetscLogGpuTimeBegin()` 2364156b51fbSBarry Smith @*/ 2365156b51fbSBarry Smith PetscErrorCode PetscLogGpuTime(void) 2366156b51fbSBarry Smith { 2367156b51fbSBarry Smith if (!PetscLogGpuTimeFlag) PetscCall(PetscRegisterFinalize(PetscLogGpuTime_Off)); 2368156b51fbSBarry Smith PetscLogGpuTimeFlag = PETSC_TRUE; 2369156b51fbSBarry Smith return 0; 2370156b51fbSBarry Smith } 2371156b51fbSBarry Smith 23729ffd0706SHong Zhang /*@C 23739ffd0706SHong Zhang PetscLogGpuTimeBegin - Start timer for device 23749ffd0706SHong Zhang 23759ffd0706SHong Zhang Notes: 23769ffd0706SHong Zhang When CUDA or HIP is enabled, the timer is run on the GPU, it is a separate logging of time devoted to GPU computations (excluding kernel launch times). 23779ffd0706SHong Zhang When CUDA or HIP is not available, the timer is run on the CPU, it is a separate logging of time devoted to GPU computations (including kernel launch times). 23789ffd0706SHong Zhang There is no need to call WaitForCUDA() or WaitForHIP() between PetscLogGpuTimeBegin and PetscLogGpuTimeEnd 23799ffd0706SHong Zhang This timer should NOT include times for data transfers between the GPU and CPU, nor setup actions such as allocating space. 23809ffd0706SHong Zhang The regular logging captures the time for data transfers and any CPU activites during the event 23819ffd0706SHong Zhang It is used to compute the flop rate on the GPU as it is actively engaged in running a kernel. 23829ffd0706SHong Zhang 23839ffd0706SHong Zhang Developer Notes: 23849ffd0706SHong Zhang The GPU event timer captures the execution time of all the kernels launched in the default stream by the CPU between PetscLogGpuTimeBegin() and PetsLogGpuTimeEnd(). 
23859ffd0706SHong Zhang PetscLogGpuTimeBegin() and PetsLogGpuTimeEnd() insert the begin and end events into the default stream (stream 0). The device will record a time stamp for the event when it reaches that event in the stream. The function xxxEventSynchronize() is called in PetsLogGpuTimeEnd() to block CPU execution, but not continued GPU excution, until the timer event is recorded. 23869ffd0706SHong Zhang 23879ffd0706SHong Zhang Level: intermediate 23889ffd0706SHong Zhang 2389db781477SPatrick Sanan .seealso: `PetscLogView()`, `PetscLogGpuFlops()`, `PetscLogGpuTimeEnd()`, `PetscLogGpuTime()` 23909ffd0706SHong Zhang @*/ 23919ffd0706SHong Zhang PetscErrorCode PetscLogGpuTimeBegin(void) 23929ffd0706SHong Zhang { 23939ffd0706SHong Zhang PetscFunctionBegin; 2394156b51fbSBarry Smith if (!PetscLogPLB || !PetscLogGpuTimeFlag) PetscFunctionReturn(0); 2395a4af0ceeSJacob Faibussowitsch if (PetscDefined(HAVE_CUDA) || PetscDefined(HAVE_HIP)) { 2396a4af0ceeSJacob Faibussowitsch PetscDeviceContext dctx; 2397a4af0ceeSJacob Faibussowitsch 23989566063dSJacob Faibussowitsch PetscCall(PetscDeviceContextGetCurrentContext(&dctx)); 23999566063dSJacob Faibussowitsch PetscCall(PetscDeviceContextBeginTimer_Internal(dctx)); 2400a4af0ceeSJacob Faibussowitsch } else { 24019566063dSJacob Faibussowitsch PetscCall(PetscTimeSubtract(&petsc_gtime)); 2402a4af0ceeSJacob Faibussowitsch } 24039ffd0706SHong Zhang PetscFunctionReturn(0); 24049ffd0706SHong Zhang } 24059ffd0706SHong Zhang 24069ffd0706SHong Zhang /*@C 24079ffd0706SHong Zhang PetscLogGpuTimeEnd - Stop timer for device 24089ffd0706SHong Zhang 24099ffd0706SHong Zhang Level: intermediate 24109ffd0706SHong Zhang 2411db781477SPatrick Sanan .seealso: `PetscLogView()`, `PetscLogGpuFlops()`, `PetscLogGpuTimeBegin()` 24129ffd0706SHong Zhang @*/ 24139ffd0706SHong Zhang PetscErrorCode PetscLogGpuTimeEnd(void) 24149ffd0706SHong Zhang { 24159ffd0706SHong Zhang PetscFunctionBegin; 2416156b51fbSBarry Smith if (!PetscLogPLE || !PetscLogGpuTimeFlag) 
PetscFunctionReturn(0); 2417a4af0ceeSJacob Faibussowitsch if (PetscDefined(HAVE_CUDA) || PetscDefined(HAVE_HIP)) { 2418a4af0ceeSJacob Faibussowitsch PetscDeviceContext dctx; 2419a4af0ceeSJacob Faibussowitsch PetscLogDouble elapsed; 2420a4af0ceeSJacob Faibussowitsch 24219566063dSJacob Faibussowitsch PetscCall(PetscDeviceContextGetCurrentContext(&dctx)); 24229566063dSJacob Faibussowitsch PetscCall(PetscDeviceContextEndTimer_Internal(dctx,&elapsed)); 2423a4af0ceeSJacob Faibussowitsch petsc_gtime += (elapsed/1000.0); 2424a4af0ceeSJacob Faibussowitsch } else { 24259566063dSJacob Faibussowitsch PetscCall(PetscTimeAdd(&petsc_gtime)); 2426a4af0ceeSJacob Faibussowitsch } 24279ffd0706SHong Zhang PetscFunctionReturn(0); 24289ffd0706SHong Zhang } 24299ffd0706SHong Zhang #endif /* end of PETSC_HAVE_DEVICE */ 24309ffd0706SHong Zhang 24315c6c1daeSBarry Smith #else /* end of -DPETSC_USE_LOG section */ 24325c6c1daeSBarry Smith 24335c6c1daeSBarry Smith PetscErrorCode PetscLogObjectState(PetscObject obj, const char format[], ...) 24345c6c1daeSBarry Smith { 24355c6c1daeSBarry Smith PetscFunctionBegin; 24365c6c1daeSBarry Smith PetscFunctionReturn(0); 24375c6c1daeSBarry Smith } 24385c6c1daeSBarry Smith 24395c6c1daeSBarry Smith #endif /* PETSC_USE_LOG*/ 24405c6c1daeSBarry Smith 24415c6c1daeSBarry Smith PetscClassId PETSC_LARGEST_CLASSID = PETSC_SMALLEST_CLASSID; 24425c6c1daeSBarry Smith PetscClassId PETSC_OBJECT_CLASSID = 0; 24435c6c1daeSBarry Smith 24445c6c1daeSBarry Smith /*@C 24455c6c1daeSBarry Smith PetscClassIdRegister - Registers a new class name for objects and logging operations in an application code. 24465c6c1daeSBarry Smith 24475c6c1daeSBarry Smith Not Collective 24485c6c1daeSBarry Smith 24495c6c1daeSBarry Smith Input Parameter: 24505c6c1daeSBarry Smith . name - The class name 24515c6c1daeSBarry Smith 24525c6c1daeSBarry Smith Output Parameter: 24535c6c1daeSBarry Smith . 
oclass - The class id or classid 24545c6c1daeSBarry Smith 24555c6c1daeSBarry Smith Level: developer 24565c6c1daeSBarry Smith 24575c6c1daeSBarry Smith @*/ 24585c6c1daeSBarry Smith PetscErrorCode PetscClassIdRegister(const char name[],PetscClassId *oclass) 24595c6c1daeSBarry Smith { 24605c6c1daeSBarry Smith #if defined(PETSC_USE_LOG) 24615c6c1daeSBarry Smith PetscStageLog stageLog; 24625c6c1daeSBarry Smith PetscInt stage; 24635c6c1daeSBarry Smith #endif 24645c6c1daeSBarry Smith 24655c6c1daeSBarry Smith PetscFunctionBegin; 24665c6c1daeSBarry Smith *oclass = ++PETSC_LARGEST_CLASSID; 24675c6c1daeSBarry Smith #if defined(PETSC_USE_LOG) 24689566063dSJacob Faibussowitsch PetscCall(PetscLogGetStageLog(&stageLog)); 24699566063dSJacob Faibussowitsch PetscCall(PetscClassRegLogRegister(stageLog->classLog, name, *oclass)); 24705c6c1daeSBarry Smith for (stage = 0; stage < stageLog->numStages; stage++) { 24719566063dSJacob Faibussowitsch PetscCall(PetscClassPerfLogEnsureSize(stageLog->stageInfo[stage].classLog, stageLog->classLog->numClasses)); 24725c6c1daeSBarry Smith } 24735c6c1daeSBarry Smith #endif 24745c6c1daeSBarry Smith PetscFunctionReturn(0); 24755c6c1daeSBarry Smith } 2476210b5426SBarry Smith 2477210b5426SBarry Smith #if defined(PETSC_USE_LOG) && defined(PETSC_HAVE_MPE) 2478210b5426SBarry Smith #include <mpe.h> 2479210b5426SBarry Smith 2480210b5426SBarry Smith PetscBool PetscBeganMPE = PETSC_FALSE; 2481210b5426SBarry Smith 2482495fc317SBarry Smith PETSC_INTERN PetscErrorCode PetscLogEventBeginMPE(PetscLogEvent,int,PetscObject,PetscObject,PetscObject,PetscObject); 2483495fc317SBarry Smith PETSC_INTERN PetscErrorCode PetscLogEventEndMPE(PetscLogEvent,int,PetscObject,PetscObject,PetscObject,PetscObject); 2484495fc317SBarry Smith 2485210b5426SBarry Smith /*@C 2486210b5426SBarry Smith PetscLogMPEBegin - Turns on MPE logging of events. This creates large log files 2487210b5426SBarry Smith and slows the program down. 
2488210b5426SBarry Smith 2489210b5426SBarry Smith Collective over PETSC_COMM_WORLD 2490210b5426SBarry Smith 2491210b5426SBarry Smith Options Database Keys: 2492a2553e36SBarry Smith . -log_mpe - Prints extensive log information 2493210b5426SBarry Smith 2494210b5426SBarry Smith Notes: 2495609bdbeeSBarry Smith A related routine is PetscLogDefaultBegin() (with the options key -log_view), which is 2496210b5426SBarry Smith intended for production runs since it logs only flop rates and object 2497210b5426SBarry Smith creation (and should not significantly slow the programs). 2498210b5426SBarry Smith 2499210b5426SBarry Smith Level: advanced 2500210b5426SBarry Smith 2501db781477SPatrick Sanan .seealso: `PetscLogDump()`, `PetscLogDefaultBegin()`, `PetscLogAllBegin()`, `PetscLogEventActivate()`, 2502db781477SPatrick Sanan `PetscLogEventDeactivate()` 2503210b5426SBarry Smith @*/ 2504210b5426SBarry Smith PetscErrorCode PetscLogMPEBegin(void) 2505210b5426SBarry Smith { 2506210b5426SBarry Smith PetscFunctionBegin; 2507210b5426SBarry Smith /* Do MPE initialization */ 2508210b5426SBarry Smith if (!MPE_Initialized_logging()) { /* This function exists in mpich 1.1.2 and higher */ 25099566063dSJacob Faibussowitsch PetscCall(PetscInfo(0,"Initializing MPE.\n")); 25109566063dSJacob Faibussowitsch PetscCall(MPE_Init_log()); 2511210b5426SBarry Smith 2512210b5426SBarry Smith PetscBeganMPE = PETSC_TRUE; 2513210b5426SBarry Smith } else { 25149566063dSJacob Faibussowitsch PetscCall(PetscInfo(0,"MPE already initialized. Not attempting to reinitialize.\n")); 2515210b5426SBarry Smith } 25169566063dSJacob Faibussowitsch PetscCall(PetscLogSet(PetscLogEventBeginMPE, PetscLogEventEndMPE)); 2517210b5426SBarry Smith PetscFunctionReturn(0); 2518210b5426SBarry Smith } 2519210b5426SBarry Smith 2520210b5426SBarry Smith /*@C 2521495fc317SBarry Smith PetscLogMPEDump - Dumps the MPE logging info to file for later use with Jumpshot. 
2522210b5426SBarry Smith 2523210b5426SBarry Smith Collective over PETSC_COMM_WORLD 2524210b5426SBarry Smith 2525210b5426SBarry Smith Level: advanced 2526210b5426SBarry Smith 2527db781477SPatrick Sanan .seealso: `PetscLogDump()`, `PetscLogAllBegin()`, `PetscLogMPEBegin()` 2528210b5426SBarry Smith @*/ 2529210b5426SBarry Smith PetscErrorCode PetscLogMPEDump(const char sname[]) 2530210b5426SBarry Smith { 2531210b5426SBarry Smith char name[PETSC_MAX_PATH_LEN]; 2532210b5426SBarry Smith 2533210b5426SBarry Smith PetscFunctionBegin; 2534210b5426SBarry Smith if (PetscBeganMPE) { 25359566063dSJacob Faibussowitsch PetscCall(PetscInfo(0,"Finalizing MPE.\n")); 2536210b5426SBarry Smith if (sname) { 25379566063dSJacob Faibussowitsch PetscCall(PetscStrcpy(name,sname)); 2538210b5426SBarry Smith } else { 25399566063dSJacob Faibussowitsch PetscCall(PetscGetProgramName(name,sizeof(name))); 2540210b5426SBarry Smith } 25419566063dSJacob Faibussowitsch PetscCall(MPE_Finish_log(name)); 2542210b5426SBarry Smith } else { 25439566063dSJacob Faibussowitsch PetscCall(PetscInfo(0,"Not finalizing MPE (not started by PETSc).\n")); 2544210b5426SBarry Smith } 2545210b5426SBarry Smith PetscFunctionReturn(0); 2546210b5426SBarry Smith } 2547210b5426SBarry Smith 2548210b5426SBarry Smith #define PETSC_RGB_COLORS_MAX 39 2549210b5426SBarry Smith static const char *PetscLogMPERGBColors[PETSC_RGB_COLORS_MAX] = { 2550210b5426SBarry Smith "OliveDrab: ", 2551210b5426SBarry Smith "BlueViolet: ", 2552210b5426SBarry Smith "CadetBlue: ", 2553210b5426SBarry Smith "CornflowerBlue: ", 2554210b5426SBarry Smith "DarkGoldenrod: ", 2555210b5426SBarry Smith "DarkGreen: ", 2556210b5426SBarry Smith "DarkKhaki: ", 2557210b5426SBarry Smith "DarkOliveGreen: ", 2558210b5426SBarry Smith "DarkOrange: ", 2559210b5426SBarry Smith "DarkOrchid: ", 2560210b5426SBarry Smith "DarkSeaGreen: ", 2561210b5426SBarry Smith "DarkSlateGray: ", 2562210b5426SBarry Smith "DarkTurquoise: ", 2563210b5426SBarry Smith "DeepPink: ", 2564210b5426SBarry 
Smith "DarkKhaki: ", 2565210b5426SBarry Smith "DimGray: ", 2566210b5426SBarry Smith "DodgerBlue: ", 2567210b5426SBarry Smith "GreenYellow: ", 2568210b5426SBarry Smith "HotPink: ", 2569210b5426SBarry Smith "IndianRed: ", 2570210b5426SBarry Smith "LavenderBlush: ", 2571210b5426SBarry Smith "LawnGreen: ", 2572210b5426SBarry Smith "LemonChiffon: ", 2573210b5426SBarry Smith "LightCoral: ", 2574210b5426SBarry Smith "LightCyan: ", 2575210b5426SBarry Smith "LightPink: ", 2576210b5426SBarry Smith "LightSalmon: ", 2577210b5426SBarry Smith "LightSlateGray: ", 2578210b5426SBarry Smith "LightYellow: ", 2579210b5426SBarry Smith "LimeGreen: ", 2580210b5426SBarry Smith "MediumPurple: ", 2581210b5426SBarry Smith "MediumSeaGreen: ", 2582210b5426SBarry Smith "MediumSlateBlue:", 2583210b5426SBarry Smith "MidnightBlue: ", 2584210b5426SBarry Smith "MintCream: ", 2585210b5426SBarry Smith "MistyRose: ", 2586210b5426SBarry Smith "NavajoWhite: ", 2587210b5426SBarry Smith "NavyBlue: ", 2588210b5426SBarry Smith "OliveDrab: " 2589210b5426SBarry Smith }; 2590210b5426SBarry Smith 2591210b5426SBarry Smith /*@C 2592210b5426SBarry Smith PetscLogMPEGetRGBColor - This routine returns a rgb color useable with PetscLogEventRegister() 2593210b5426SBarry Smith 2594210b5426SBarry Smith Not collective. Maybe it should be? 2595210b5426SBarry Smith 25967a7aea1fSJed Brown Output Parameter: 2597210b5426SBarry Smith . 
str - character string representing the color 2598210b5426SBarry Smith 2599210b5426SBarry Smith Level: developer 2600210b5426SBarry Smith 2601db781477SPatrick Sanan .seealso: `PetscLogEventRegister` 2602210b5426SBarry Smith @*/ 2603210b5426SBarry Smith PetscErrorCode PetscLogMPEGetRGBColor(const char *str[]) 2604210b5426SBarry Smith { 2605210b5426SBarry Smith static int idx = 0; 2606210b5426SBarry Smith 2607210b5426SBarry Smith PetscFunctionBegin; 2608210b5426SBarry Smith *str = PetscLogMPERGBColors[idx]; 2609210b5426SBarry Smith idx = (idx + 1)% PETSC_RGB_COLORS_MAX; 2610210b5426SBarry Smith PetscFunctionReturn(0); 2611210b5426SBarry Smith } 2612210b5426SBarry Smith 2613210b5426SBarry Smith #endif /* PETSC_USE_LOG && PETSC_HAVE_MPE */ 2614