3232#include < nvbench/stopping_criterion.cuh>
3333#include < nvbench/types.cuh>
3434
35- #include < cuda_runtime.h>
3635#include < cuda_profiler_api.h>
36+ #include < cuda_runtime.h>
37+
3738#include < utility>
3839#include < vector>
3940
@@ -76,14 +77,8 @@ protected:
7677 {
7778 NVBENCH_CUDA_CALL (cudaStreamSynchronize (m_launch.get_stream ()));
7879 }
79- __forceinline__ void profiler_start () const
80- {
81- NVBENCH_CUDA_CALL (cudaProfilerStart ());
82- }
83- __forceinline__ void profiler_stop () const
84- {
85- NVBENCH_CUDA_CALL (cudaProfilerStop ());
86- }
80+ __forceinline__ void profiler_start () const { NVBENCH_CUDA_CALL (cudaProfilerStart ()); }
81+ __forceinline__ void profiler_stop () const { NVBENCH_CUDA_CALL (cudaProfilerStop ()); }
8782 void block_stream ();
8883 __forceinline__ void unblock_stream () { m_blocker.unblock (); }
8984
@@ -143,7 +138,9 @@ struct measure_cold_base::kernel_launch_timer
143138 , m_run_once{measure.m_run_once }
144139 {}
145140
146- explicit kernel_launch_timer (measure_cold_base &measure, bool disable_blocking_kernel, bool run_once)
141+ explicit kernel_launch_timer (measure_cold_base &measure,
142+ bool disable_blocking_kernel,
143+ bool run_once)
147144 : m_measure{measure}
148145 , m_disable_blocking_kernel{disable_blocking_kernel}
149146 , m_run_once{run_once}
@@ -161,7 +158,7 @@ struct measure_cold_base::kernel_launch_timer
161158 {
162159 m_measure.gpu_frequency_start ();
163160 }
164- if (!m_run_once)
161+ if (!m_run_once)
165162 {
166163 m_measure.profiler_start ();
167164 }
@@ -183,7 +180,7 @@ struct measure_cold_base::kernel_launch_timer
183180 m_measure.gpu_frequency_stop ();
184181 }
185182 m_measure.sync_stream ();
186- if (!m_run_once)
183+ if (!m_run_once)
187184 {
188185 m_measure.profiler_stop ();
189186 }
0 commit comments