2626void summary_example (nvbench::state &state)
2727{
2828 // Fetch parameters and compute duration in seconds:
29- const auto ms = static_cast <nvbench::float64_t >(state.get_int64 (" ms" ));
30- const auto us = static_cast <nvbench::float64_t >(state.get_int64 (" us" ));
29+ const auto ms = static_cast <nvbench::float64_t >(state.get_int64 (" ms" ));
30+ const auto us = static_cast <nvbench::float64_t >(state.get_int64 (" us" ));
3131 const auto duration = ms * 1e-3 + us * 1e-6 ;
3232
3333 // Add a new column to the summary table with the derived duration used by the benchmark.
@@ -41,7 +41,7 @@ void summary_example(nvbench::state &state)
4141 }
4242
4343 // Run the measurements:
44- state.exec ([duration](nvbench::launch &launch) {
44+ state.exec (nvbench::exec_tag::no_batch, [duration](nvbench::launch &launch) {
4545 nvbench::sleep_kernel<<<1 , 1 , 0 , launch.get_stream()>>> (duration);
4646 });
4747
@@ -56,14 +56,17 @@ void summary_example(nvbench::state &state)
5656#endif
5757
5858 // Default summary columns can be shown/hidden in the markdown output tables by adding/removing
59- // the "hide" key. Modify this benchmark to show the minimum and maximum times, but hide the
60- // means .
59+ // the "hide" key. Modify this benchmark to show the minimum and maximum GPU times, but hide the
60+ // mean GPU time and all CPU times. SM clock frequency and throttling info are also shown.
6161 state.get_summary (" nv/cold/time/gpu/min" ).remove_value (" hide" );
6262 state.get_summary (" nv/cold/time/gpu/max" ).remove_value (" hide" );
6363 state.get_summary (" nv/cold/time/gpu/mean" ).set_string (" hide" , " " );
64- state.get_summary (" nv/cold/time/cpu/min" ).remove_value (" hide" );
65- state.get_summary (" nv/cold/time/cpu/max" ).remove_value (" hide" );
6664 state.get_summary (" nv/cold/time/cpu/mean" ).set_string (" hide" , " " );
65+ state.get_summary (" nv/cold/time/cpu/min" ).set_string (" hide" , " " );
66+ state.get_summary (" nv/cold/time/cpu/max" ).set_string (" hide" , " " );
67+ state.get_summary (" nv/cold/time/cpu/stdev/relative" ).set_string (" hide" , " " );
68+ state.get_summary (" nv/cold/sm_clock_rate/mean" ).remove_value (" hide" );
69+ state.get_summary (" nv/cold/sm_clock_rate/scaling/percent" ).remove_value (" hide" );
6770}
6871NVBENCH_BENCH (summary_example)
6972 .add_int64_axis(" ms" , nvbench::range(10 , 50 , 20 ))
0 commit comments