1818
1919#pragma once
2020
21+ #include < cuda_runtime.h>
22+
2123#include < nvbench/blocking_kernel.cuh>
2224#include < nvbench/cpu_timer.cuh>
2325#include < nvbench/cuda_call.cuh>
2426#include < nvbench/cuda_timer.cuh>
27+ #include < nvbench/detail/gpu_frequency.cuh>
28+ #include < nvbench/detail/kernel_launcher_timer_wrapper.cuh>
29+ #include < nvbench/detail/l2flush.cuh>
30+ #include < nvbench/detail/statistics.cuh>
2531#include < nvbench/device_info.cuh>
2632#include < nvbench/exec_tag.cuh>
2733#include < nvbench/launch.cuh>
2834#include < nvbench/stopping_criterion.cuh>
2935
30- #include < nvbench/detail/kernel_launcher_timer_wrapper.cuh>
31- #include < nvbench/detail/l2flush.cuh>
32- #include < nvbench/detail/statistics.cuh>
33- #include < nvbench/detail/gpu_frequency.cuh>
34-
35- #include < cuda_runtime.h>
36-
3736#include < utility>
3837#include < vector>
38+
3939#include " nvbench/types.cuh"
4040
4141namespace nvbench
@@ -91,7 +91,7 @@ protected:
9191 nvbench::blocking_kernel m_blocker;
9292
9393 nvbench::criterion_params m_criterion_params;
94- nvbench::stopping_criterion_base& m_stopping_criterion;
94+ nvbench::stopping_criterion_base & m_stopping_criterion;
9595 nvbench::detail::gpu_frequency m_gpu_frequency;
9696
9797 bool m_disable_blocking_kernel{false };
@@ -102,8 +102,8 @@ protected:
102102 nvbench::float64_t m_skip_time{};
103103 nvbench::float64_t m_timeout{};
104104
105- nvbench::float32_t m_throttle_threshold{ 0 . 75f }; // [% of peak SM clock rate]
106- nvbench::float32_t m_throttle_recovery_delay{ 0 . 0f } ; // [seconds]
105+ nvbench::float32_t m_throttle_threshold; // [% of peak SM clock rate]
106+ nvbench::float32_t m_throttle_recovery_delay; // [seconds]
107107 bool m_discard_on_throttle{false };
108108
109109 nvbench::int64_t m_total_samples{};
0 commit comments