Skip to content

Commit c78d3ec

Browse files
committed
Merge remote-tracking branch 'origin/main'
2 parents dbc2cc1 + cadcd4b commit c78d3ec

File tree

3 files changed

+12
-0
lines changed

3 files changed

+12
-0
lines changed

include/hws/gpu_nvidia/utility.hpp

+4
Original file line numberDiff line numberDiff line change
@@ -52,13 +52,17 @@ namespace hws::detail {
5252
#define HWS_CUDA_ERROR_CHECK(cuda_func) cuda_func;
5353
#endif
5454

55+
#if CUDA_VERSION >= 12000
56+
5557
/**
5658
* @brief Convert the clock throttle reason event bitmask to a string representation. If the provided bitmask represents multiple reasons, they are split using "|".
5759
* @param[in] clocks_event_reasons the bitmask to convert to a string
5860
* @return all event throttle reasons (`[[nodiscard]]`)
5961
*/
6062
[[nodiscard]] std::string throttle_event_reason_to_string(unsigned long long clocks_event_reasons);
6163

64+
#endif
65+
6266
} // namespace hws::detail
6367

6468
#endif // HWS_GPU_NVIDIA_UTILITY_HPP_

src/hws/gpu_nvidia/hardware_sampler.cpp

+4
Original file line numberDiff line numberDiff line change
@@ -267,11 +267,13 @@ void gpu_nvidia_hardware_sampler::sampling_loop() {
267267
clock_samples_.memory_clock_frequency_ = decltype(clock_samples_.memory_clock_frequency_)::value_type{ static_cast<decltype(clock_samples_.memory_clock_frequency_)::value_type::value_type>(clock_mem) };
268268
}
269269

270+
#if CUDA_VERSION >= 12000
270271
decltype(clock_samples_.throttle_reason_)::value_type::value_type clock_throttle_reason{};
271272
if (nvmlDeviceGetCurrentClocksEventReasons(device, &clock_throttle_reason) == NVML_SUCCESS) {
272273
clock_samples_.throttle_reason_ = decltype(clock_samples_.throttle_reason_)::value_type{ clock_throttle_reason };
273274
clock_samples_.throttle_reason_string_ = decltype(clock_samples_.throttle_reason_string_)::value_type{ detail::throttle_event_reason_to_string(clock_throttle_reason) };
274275
}
276+
#endif
275277

276278
nvmlEnableState_t mode{};
277279
nvmlEnableState_t default_mode{};
@@ -464,12 +466,14 @@ void gpu_nvidia_hardware_sampler::sampling_loop() {
464466
clock_samples_.memory_clock_frequency_->push_back(static_cast<decltype(clock_samples_.memory_clock_frequency_)::value_type::value_type>(value));
465467
}
466468

469+
#if CUDA_VERSION >= 12000
467470
if (clock_samples_.throttle_reason_string_.has_value()) {
468471
decltype(clock_samples_.throttle_reason_)::value_type::value_type value{};
469472
HWS_NVML_ERROR_CHECK(nvmlDeviceGetCurrentClocksEventReasons(device, &value))
470473
clock_samples_.throttle_reason_->push_back(value);
471474
clock_samples_.throttle_reason_string_->push_back(detail::throttle_event_reason_to_string(value));
472475
}
476+
#endif
473477

474478
if (clock_samples_.auto_boosted_clock_.has_value()) {
475479
nvmlEnableState_t mode{};

src/hws/gpu_nvidia/utility.cpp

+4
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,8 @@
1616

1717
namespace hws::detail {
1818

19+
#if CUDA_VERSION >= 12000
20+
1921
std::string throttle_event_reason_to_string(const unsigned long long clocks_event_reasons) {
2022
if (clocks_event_reasons == 0ull) {
2123
return "None";
@@ -52,4 +54,6 @@ std::string throttle_event_reason_to_string(const unsigned long long clocks_even
5254
}
5355
}
5456

57+
#endif
58+
5559
} // namespace hws::detail

0 commit comments

Comments
 (0)