We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents e5a04c8 + 2ab76a8, commit 3de9dc9 (Copy full SHA for 3de9dc9)
nvbench/detail/measure_cold.cuh
@@ -153,18 +153,16 @@ struct measure_cold_base::kernel_launch_timer
153
m_measure.gpu_frequency_start();
154
}
155
m_measure.m_cuda_timer.start(m_measure.m_launch.get_stream());
156
- if (m_disable_blocking_kernel)
157
- {
158
- m_measure.m_cpu_timer.start();
159
- }
+ // start CPU timer irrespective of use of blocking kernel
+ // Ref: https://github.com/NVIDIA/nvbench/issues/249
+ m_measure.m_cpu_timer.start();
160
161
162
__forceinline__ void stop()
163
{
164
m_measure.m_cuda_timer.stop(m_measure.m_launch.get_stream());
165
if (!m_disable_blocking_kernel)
166
167
168
m_measure.unblock_stream();
169
170
if (m_measure.m_check_throttling)
0 commit comments