/* * ============================================================================= * ROC Runtime Conformance Release License * ============================================================================= * The University of Illinois/NCSA * Open Source License (NCSA) * * Copyright (c) 2017-2023, Advanced Micro Devices, Inc. * All rights reserved. * * Developed by: * * AMD Research and AMD ROC Software Development * * Advanced Micro Devices, Inc. * * www.amd.com * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to * deal with the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * - Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimers. * - Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimers in * the documentation and/or other materials provided with the distribution. * - Neither the names of , * nor the names of its contributors may be used to endorse or promote * products derived from this Software without specific prior written * permission. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER * DEALINGS WITH THE SOFTWARE. * */ #include #include #include #include #include #include #include #include "rocm_smi/rocm_smi.h" #define PRINT_RSMI_ERR(RET) { \ if (RET != RSMI_STATUS_SUCCESS) { \ const char *err_str; \ std::cout << "[ERROR] RSMI call returned " << (RET) \ << " at line " << __LINE__ << std::endl; \ rsmi_status_string((RET), &err_str); \ std::cout << err_str << std::endl; \ } \ } #define CHK_RSMI_RET(RET) { \ PRINT_RSMI_ERR(RET) \ if (RET != RSMI_STATUS_SUCCESS) { \ return (RET); \ } \ } #define CHK_AND_PRINT_RSMI_ERR_RET(RET) { \ PRINT_RSMI_ERR(RET) \ CHK_RSMI_RET(RET) \ } #define CHK_RSMI_RET_I(RET) { \ PRINT_RSMI_ERR(RET) \ if (RET != RSMI_STATUS_SUCCESS) { \ return static_cast(RET); \ } \ } #define CHK_FILE_PERMISSIONS(RET) { \ if ((RET) == RSMI_STATUS_PERMISSION) { \ if (isFileWritable(RET)) { \ CHK_RSMI_RET(RET) \ } \ } else { \ CHK_RSMI_RET(RET) \ } \ } #define CHK_FILE_PERMISSIONS_AND_NOT_SUPPORTED_OR_UNIMPLEMENTED(RET) { \ if ((RET) == RSMI_STATUS_PERMISSION) { \ if (isFileWritable(RET)) { \ CHK_RSMI_RET(RET) \ } \ } else if ((RET) == RSMI_STATUS_NOT_SUPPORTED) { \ std::cout << "Not Supported." \ << std::endl; \ } else if ((RET) == RSMI_STATUS_NOT_YET_IMPLEMENTED) { \ std::cout << "Not Yet Implemented." \ << std::endl; \ } else { \ CHK_RSMI_RET(RET) \ } \ } #define CHK_RSMI_NOT_SUPPORTED_RET(RET) { \ if ((RET) == RSMI_STATUS_NOT_SUPPORTED) { \ std::cout << "Not Supported." \ << std::endl; \ } else { \ CHK_RSMI_RET(RET) \ } \ } #define CHK_RSMI_NOT_SUPPORTED_OR_UNEXPECTED_DATA_RET(RET) { \ if ((RET) == RSMI_STATUS_NOT_SUPPORTED) { \ std::cout << "Not Supported." \ << std::endl; \ } else if ((RET) == RSMI_STATUS_UNEXPECTED_DATA) { \ std::cout << "[ERROR] RSMI_STATUS_UNEXPECTED_DATA retrieved." \ << std::endl; \ } else { \ CHK_RSMI_RET(RET) \ } \ } #define CHK_RSMI_NOT_SUPPORTED_OR_SETTING_UNAVAILABLE_RET(RET) {\ if ((RET) == RSMI_STATUS_NOT_SUPPORTED) { \ std::cout << "Not Supported."\ << std::endl; \ } else if ((RET) == RSMI_STATUS_SETTING_UNAVAILABLE) { \ std::cout << "[WARN] RSMI_STATUS_SETTING_UNAVAILABLE retrieved." \ << std::endl; \ } else { \ CHK_RSMI_RET(RET) \ } \ } #define CHK_NOT_SUPPORTED_OR_UNEXPECTED_DATA_OR_INSUFFICIENT_SIZE_RET(RET) { \ if ((RET) == RSMI_STATUS_NOT_SUPPORTED) { \ std::cout << "Not Supported." \ << std::endl; \ } else if ((RET) == RSMI_STATUS_UNEXPECTED_DATA) { \ std::cout << "[WARN] RSMI_STATUS_UNEXPECTED_DATA retrieved." \ << std::endl; \ } else if ((RET) == RSMI_STATUS_INSUFFICIENT_SIZE) { \ std::cout << "[WARN] RSMI_STATUS_INSUFFICIENT_SIZE retrieved." \ << std::endl; \ } else { \ CHK_RSMI_RET(RET) \ } \ } static void print_test_header(const char *str, uint32_t dv_ind) { std::cout << "********************************" << std::endl; std::cout << "*** " << str << std::endl; std::cout << "********************************" << std::endl; std::cout << "Device index: " << dv_ind << std::endl; } static void print_mini_header(const char *str) { std::cout << "\n>> " << str << " <<" << std::endl; } static const char * power_profile_string(rsmi_power_profile_preset_masks_t profile) { switch (profile) { case RSMI_PWR_PROF_PRST_CUSTOM_MASK: return "CUSTOM"; case RSMI_PWR_PROF_PRST_VIDEO_MASK: return "VIDEO"; case RSMI_PWR_PROF_PRST_POWER_SAVING_MASK: return "POWER SAVING"; case RSMI_PWR_PROF_PRST_COMPUTE_MASK: return "COMPUTE"; case RSMI_PWR_PROF_PRST_VR_MASK: return "VR"; case RSMI_PWR_PROF_PRST_3D_FULL_SCR_MASK: return "3D FULL SCREEN"; default: return "UNKNOWN"; } } static const std::string compute_partition_string(rsmi_compute_partition_type partition) { switch (partition) { case RSMI_COMPUTE_PARTITION_CPX: return "CPX"; case RSMI_COMPUTE_PARTITION_SPX: return "SPX"; case RSMI_COMPUTE_PARTITION_DPX: return "DPX"; case RSMI_COMPUTE_PARTITION_TPX: return "TPX"; case RSMI_COMPUTE_PARTITION_QPX: return "QPX"; default: return "UNKNOWN"; } } static std::map mapStringToRSMIComputePartitionTypes { {"CPX", RSMI_COMPUTE_PARTITION_CPX}, {"SPX", RSMI_COMPUTE_PARTITION_SPX}, {"DPX", RSMI_COMPUTE_PARTITION_DPX}, {"TPX", RSMI_COMPUTE_PARTITION_TPX}, {"QPX", RSMI_COMPUTE_PARTITION_QPX} }; static const std::string nps_mode_string(rsmi_nps_mode_type_t partition) { switch (partition) { case RSMI_MEMORY_PARTITION_NPS1: return "NPS1"; case RSMI_MEMORY_PARTITION_NPS2: return "NPS2"; case RSMI_MEMORY_PARTITION_NPS4: return "NPS4"; case RSMI_MEMORY_PARTITION_NPS8: return "NPS8"; default: return "UNKNOWN"; } } static std::map mapStringToRSMINpsModeTypes { {"NPS1", RSMI_MEMORY_PARTITION_NPS1}, {"NPS2", RSMI_MEMORY_PARTITION_NPS2}, {"NPS4", RSMI_MEMORY_PARTITION_NPS4}, {"NPS8", RSMI_MEMORY_PARTITION_NPS8} }; static const char * perf_level_string(rsmi_dev_perf_level_t perf_lvl) { switch (perf_lvl) { case RSMI_DEV_PERF_LEVEL_AUTO: return "AUTO"; case RSMI_DEV_PERF_LEVEL_LOW: return "LOW"; case RSMI_DEV_PERF_LEVEL_HIGH: return "HIGH"; case RSMI_DEV_PERF_LEVEL_MANUAL: return "MANUAL"; default: return "UNKNOWN"; } } static bool isUserRunningAsSudo() { bool isRunningWithSudo = false; auto myUID = getuid(); auto myPrivledges = geteuid(); if ((myUID == myPrivledges) && (myPrivledges == 0)) { isRunningWithSudo = true; } return isRunningWithSudo; } static bool isFileWritable(rsmi_status_t response) { // Clock files may not be writable, causing sets to // return RSMI_STATUS_PERMISSION. If running as sudo, // this means file is not writable. // isFileWritable(ret) - intends to capture this // response situation. bool fileWritable = true; if (isUserRunningAsSudo() && (response == RSMI_STATUS_PERMISSION)) { std::cout << "[WARN] User is running with sudo " << "permissions, file is not writable." << std::endl; fileWritable = false; } else { CHK_AND_PRINT_RSMI_ERR_RET(response) } return fileWritable; } static rsmi_status_t test_power_profile(uint32_t dv_ind) { rsmi_status_t ret; rsmi_power_profile_status_t status; print_test_header("Power Profile", dv_ind); std::cout << "The available power profiles are: "; ret = rsmi_dev_power_profile_presets_get(dv_ind, 0, &status); CHK_RSMI_NOT_SUPPORTED_RET(ret) if (ret != RSMI_STATUS_SUCCESS) { std::cout << "***Skipping Power Profile test." << std::endl; return RSMI_STATUS_SUCCESS; } CHK_RSMI_RET(ret) std::cout << "The available power profiles are:" << std::endl; uint64_t tmp = 1; while (tmp <= RSMI_PWR_PROF_PRST_LAST) { if ((tmp & status.available_profiles) == tmp) { std::cout << "\t" << power_profile_string((rsmi_power_profile_preset_masks_t)tmp) << std::endl; } tmp = tmp << 1; } std::cout << "The current power profile is: " << power_profile_string(status.current) << std::endl; // Try setting the profile to a different power profile rsmi_bit_field_t diff_profiles; rsmi_power_profile_preset_masks_t new_prof; diff_profiles = status.available_profiles & (~status.current); if (diff_profiles & RSMI_PWR_PROF_PRST_COMPUTE_MASK) { new_prof = RSMI_PWR_PROF_PRST_COMPUTE_MASK; } else if (diff_profiles & RSMI_PWR_PROF_PRST_VIDEO_MASK) { new_prof = RSMI_PWR_PROF_PRST_VIDEO_MASK; } else if (diff_profiles & RSMI_PWR_PROF_PRST_VR_MASK) { new_prof = RSMI_PWR_PROF_PRST_VR_MASK; } else if (diff_profiles & RSMI_PWR_PROF_PRST_POWER_SAVING_MASK) { new_prof = RSMI_PWR_PROF_PRST_POWER_SAVING_MASK; } else if (diff_profiles & RSMI_PWR_PROF_PRST_3D_FULL_SCR_MASK) { new_prof = RSMI_PWR_PROF_PRST_3D_FULL_SCR_MASK; } else { std::cout << "No other non-custom power profiles to set to" << std::endl; return ret; } std::cout << "Setting power profile to " << power_profile_string(new_prof) << "..." << std::endl; ret = rsmi_dev_power_profile_set(dv_ind, 0, new_prof); CHK_RSMI_RET(ret) std::cout << "Done." << std::endl; rsmi_dev_perf_level_t pfl; ret = rsmi_dev_perf_level_get(dv_ind, &pfl); CHK_RSMI_RET(ret) std::cout << "Performance Level is now " << perf_level_string(pfl) << std::endl; ret = rsmi_dev_power_profile_presets_get(dv_ind, 0, &status); CHK_RSMI_RET(ret) std::cout << "The current power profile is: " << power_profile_string(status.current) << std::endl; std::cout << "Resetting perf level to auto..." << std::endl; ret = rsmi_dev_perf_level_set_v1(dv_ind, RSMI_DEV_PERF_LEVEL_AUTO); CHK_RSMI_RET(ret) std::cout << "Done." << std::endl; ret = rsmi_dev_perf_level_get(dv_ind, &pfl); CHK_RSMI_RET(ret) std::cout << "Performance Level is now " << perf_level_string(pfl) << std::endl; ret = rsmi_dev_power_profile_presets_get(dv_ind, 0, &status); CHK_RSMI_RET(ret) std::cout << "The current power profile is: " << power_profile_string(status.current) << std::endl; return ret; } static rsmi_status_t test_power_cap(uint32_t dv_ind) { rsmi_status_t ret; uint64_t orig, min, max, new_cap; print_test_header("Power Control", dv_ind); ret = rsmi_dev_power_cap_range_get(dv_ind, 0, &max, &min); CHK_RSMI_RET(ret) ret = rsmi_dev_power_cap_get(dv_ind, 0, &orig); CHK_RSMI_RET(ret) std::cout << "Original Power Cap: " << orig << " uW" << std::endl; std::cout << "Power Cap Range: " << max << " uW to " << min << " uW" << std::endl; new_cap = (max + min)/2; std::cout << "Setting new cap to " << new_cap << "..." << std::endl; ret = rsmi_dev_power_cap_set(dv_ind, 0, new_cap); CHK_RSMI_RET(ret) ret = rsmi_dev_power_cap_get(dv_ind, 0, &new_cap); CHK_RSMI_RET(ret) std::cout << "New Power Cap: " << new_cap << " uW" << std::endl; std::cout << "Resetting cap to " << orig << "..." << std::endl; ret = rsmi_dev_power_cap_set(dv_ind, 0, orig); CHK_RSMI_RET(ret) ret = rsmi_dev_power_cap_get(dv_ind, 0, &new_cap); CHK_RSMI_RET(ret) std::cout << "Current Power Cap: " << new_cap << " uW" << std::endl; return ret; } static rsmi_status_t test_set_overdrive(uint32_t dv_ind) { rsmi_status_t ret; uint32_t val; print_test_header("Overdrive Control", dv_ind); std::cout << "Set Overdrive level to 0%..." << std::endl; ret = rsmi_dev_overdrive_level_set_v1(dv_ind, 0); CHK_RSMI_RET(ret) std::cout << "Set Overdrive level to 10%..." << std::endl; ret = rsmi_dev_overdrive_level_set_v1(dv_ind, 10); CHK_RSMI_RET(ret) ret = rsmi_dev_overdrive_level_get(dv_ind, &val); CHK_RSMI_RET(ret) std::cout << "\t**New OverDrive Level:" << std::dec << val << std::endl; std::cout << "Reset Overdrive level to 0%..." << std::endl; ret = rsmi_dev_overdrive_level_set_v1(dv_ind, 0); CHK_RSMI_RET(ret) ret = rsmi_dev_overdrive_level_get(dv_ind, &val); CHK_RSMI_RET(ret) std::cout << "\t**New OverDrive Level:" << std::dec << val << std::endl; return ret; } static rsmi_status_t test_set_fan_speed(uint32_t dv_ind) { rsmi_status_t ret; int64_t orig_speed; double new_speed; int64_t cur_spd; print_test_header("Fan Speed Control", dv_ind); std::cout << "Original fan speed: "; ret = rsmi_dev_fan_speed_get(dv_ind, 0, &orig_speed); if (ret == RSMI_STATUS_SUCCESS) { std::cout << orig_speed << std::endl; } else { CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "***Skipping Fan Speed Control test." << std::endl; return RSMI_STATUS_SUCCESS; } if (orig_speed == 0) { std::cout << "***System fan speed value is 0. Skip fan test." << std::endl; return RSMI_STATUS_SUCCESS; } new_speed = 1.1 * static_cast(orig_speed); std::cout << "Setting fan speed to " << new_speed << std::endl; ret = rsmi_dev_fan_speed_set(dv_ind, 0, static_cast(new_speed)); CHK_RSMI_RET(ret) sleep(4); ret = rsmi_dev_fan_speed_get(dv_ind, 0, &cur_spd); CHK_RSMI_RET(ret) std::cout << "New fan speed: " << cur_spd << std::endl; assert( (cur_spd > static_cast(0.95 * static_cast(new_speed)) && cur_spd < static_cast(1.1 * static_cast(new_speed))) || (cur_spd > static_cast(0.95 * static_cast(RSMI_MAX_FAN_SPEED)))); std::cout << "Resetting fan control to auto..." << std::endl; ret = rsmi_dev_fan_reset(dv_ind, 0); CHK_RSMI_RET(ret) sleep(3); ret = rsmi_dev_fan_speed_get(dv_ind, 0, &cur_spd); CHK_RSMI_RET(ret) std::cout << "End fan speed: " << cur_spd << std::endl; return ret; } static rsmi_status_t test_set_perf_level(uint32_t dv_ind) { rsmi_status_t ret; rsmi_dev_perf_level_t pfl, orig_pfl; print_test_header("Performance Level Control", dv_ind); ret = rsmi_dev_perf_level_get(dv_ind, &orig_pfl); CHK_RSMI_RET(ret) std::cout << "\t**Original Perf Level:" << perf_level_string(orig_pfl) << std::endl; pfl = (rsmi_dev_perf_level_t)((orig_pfl + 1) % (RSMI_DEV_PERF_LEVEL_LAST + 1)); std::cout << "Set Performance Level to " << (uint32_t)pfl << " ..." << std::endl; ret = rsmi_dev_perf_level_set_v1(dv_ind, pfl); if (ret != RSMI_STATUS_SUCCESS) { CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "***Skipping Performance Level Control test." << std::endl; return RSMI_STATUS_SUCCESS; } CHK_RSMI_RET(ret) ret = rsmi_dev_perf_level_get(dv_ind, &pfl); CHK_RSMI_RET(ret) std::cout << "\t**New Perf Level:" << perf_level_string(pfl) << std::endl; std::cout << "Reset Perf level to " << orig_pfl << " ..." << std::endl; ret = rsmi_dev_perf_level_set_v1(dv_ind, orig_pfl); CHK_RSMI_RET(ret) ret = rsmi_dev_perf_level_get(dv_ind, &pfl); CHK_RSMI_RET(ret) std::cout << "\t**New Perf Level:" << perf_level_string(pfl) << std::endl; return ret; } static rsmi_status_t test_set_freq(uint32_t dv_ind) { rsmi_status_t ret; rsmi_frequencies_t f; uint32_t freq_bitmask; rsmi_clk_type rsmi_clk; // Clock files may not be writable, causing sets to // return RSMI_STATUS_PERMISSION even if running with // sudo. See isFileWritable() for more info. print_test_header("Clock Frequency Control", dv_ind); for (uint32_t clk = (uint32_t)RSMI_CLK_TYPE_FIRST; clk <= RSMI_CLK_TYPE_LAST; ++clk) { std::string miniHeader = "Testing clock" + std::to_string(clk); print_mini_header(miniHeader.c_str()); rsmi_clk = (rsmi_clk_type)clk; ret = rsmi_dev_gpu_clk_freq_get(dv_ind, rsmi_clk, &f); CHK_FILE_PERMISSIONS_AND_NOT_SUPPORTED_OR_UNIMPLEMENTED(ret) std::cout << "Initial frequency for clock" << rsmi_clk << " is " << f.current << std::endl; // Set clocks to something other than the usual default of the lowest // frequency. freq_bitmask = 0b01100; // Try the 3rd and 4th clocks std::string freq_bm_str = std::bitset(freq_bitmask).to_string(); freq_bm_str.erase(0, std::min(freq_bm_str.find_first_not_of('0'), freq_bm_str.size()-1)); std::cout << "Setting frequency mask for clock " << rsmi_clk << " to 0b" << freq_bm_str << " ..." << std::endl; ret = rsmi_dev_gpu_clk_freq_set(dv_ind, rsmi_clk, freq_bitmask); CHK_FILE_PERMISSIONS_AND_NOT_SUPPORTED_OR_UNIMPLEMENTED(ret) ret = rsmi_dev_gpu_clk_freq_get(dv_ind, rsmi_clk, &f); CHK_FILE_PERMISSIONS_AND_NOT_SUPPORTED_OR_UNIMPLEMENTED(ret) std::cout << "Frequency is now index " << f.current << std::endl; std::cout << "Resetting mask to all frequencies." << std::endl; ret = rsmi_dev_gpu_clk_freq_set(dv_ind, rsmi_clk, 0xFFFFFFFF); CHK_FILE_PERMISSIONS_AND_NOT_SUPPORTED_OR_UNIMPLEMENTED(ret) ret = rsmi_dev_perf_level_set_v1(dv_ind, RSMI_DEV_PERF_LEVEL_AUTO); CHK_FILE_PERMISSIONS(ret) } std::cout << std::endl; return RSMI_STATUS_SUCCESS; } static void print_frequencies(rsmi_frequencies_t *f) { assert(f != nullptr); for (uint32_t j = 0; j < f->num_supported; ++j) { std::cout << "\t** " << j << ": " << f->frequency[j]; if (j == f->current) { std::cout << " *"; } std::cout << std::endl; } } static rsmi_status_t test_set_compute_partitioning(uint32_t dv_ind) { rsmi_status_t ret; uint32_t buffer_len = 10; char originalComputePartition[buffer_len]; originalComputePartition[0] = '\0'; print_test_header("Compute Partitioning Control", dv_ind); ret = rsmi_dev_compute_partition_get(dv_ind, originalComputePartition, buffer_len); CHK_RSMI_NOT_SUPPORTED_OR_UNEXPECTED_DATA_RET(ret) if (ret == RSMI_STATUS_NOT_SUPPORTED) { return RSMI_STATUS_SUCCESS; } std::cout << "Original Compute Partition: " << (((originalComputePartition == nullptr) || ((originalComputePartition != nullptr) && (originalComputePartition[0] == '\0'))) ? "UNKNOWN" : originalComputePartition) << std::endl << std::endl; for (int newComputePartition = RSMI_COMPUTE_PARTITION_CPX; newComputePartition <= RSMI_COMPUTE_PARTITION_QPX; newComputePartition++) { rsmi_compute_partition_type newPartition = static_cast(newComputePartition); std::cout << "Attempting to set compute partition to " << compute_partition_string(newPartition) << "..." << std::endl; ret = rsmi_dev_compute_partition_set(dv_ind, newPartition); CHK_RSMI_NOT_SUPPORTED_OR_SETTING_UNAVAILABLE_RET(ret) std::cout << "Done setting compute partition to " << compute_partition_string(newPartition) << "." << std::endl; std::cout << std::endl << std::endl; } std::cout << "About to initate compute partition reset..." << std::endl; ret = rsmi_dev_compute_partition_reset(dv_ind); CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "Done resetting compute partition." << std::endl; std::string myComputePartition = originalComputePartition; if (myComputePartition.empty() == false) { std::cout << "Resetting back to original compute partition to " << originalComputePartition << "... " << std::endl; rsmi_compute_partition_type origComputePartitionType = mapStringToRSMIComputePartitionTypes[originalComputePartition]; ret = rsmi_dev_compute_partition_set(dv_ind, origComputePartitionType); CHK_RSMI_NOT_SUPPORTED_OR_SETTING_UNAVAILABLE_RET(ret) std::cout << "Done" << std::endl; } return RSMI_STATUS_SUCCESS; } static rsmi_status_t test_set_nps_mode(uint32_t dv_ind) { rsmi_status_t ret; uint32_t buffer_len = 10; char originalNpsMode[buffer_len]; originalNpsMode[0] = '\0'; print_test_header("NPS Mode Control", dv_ind); ret = rsmi_dev_nps_mode_get(dv_ind, originalNpsMode, buffer_len); CHK_RSMI_NOT_SUPPORTED_OR_UNEXPECTED_DATA_RET(ret) if (ret == RSMI_STATUS_NOT_SUPPORTED) { return RSMI_STATUS_SUCCESS; } std::cout << "Original NPS Mode: " << (((originalNpsMode == nullptr) || ((originalNpsMode != nullptr) && (originalNpsMode[0] == '\0'))) ? "UNKNOWN" : originalNpsMode) << std::endl << std::endl; for (int newNpsMode = RSMI_MEMORY_PARTITION_NPS1; newNpsMode <= RSMI_MEMORY_PARTITION_NPS8; newNpsMode++) { rsmi_nps_mode_type_t newMemoryPartition = static_cast(newNpsMode); std::cout << "Attempting to set NPS mode to " << nps_mode_string(newMemoryPartition) << "..." << std::endl; ret = rsmi_dev_nps_mode_set(dv_ind, newMemoryPartition); CHK_RSMI_NOT_SUPPORTED_RET(ret) if (ret == RSMI_STATUS_NOT_SUPPORTED) { // do not continue attempting to set, device does not support setting return RSMI_STATUS_SUCCESS; } std::cout << "Done setting NPS mode to " << nps_mode_string(newMemoryPartition) << "." << std::endl; std::cout << std::endl << std::endl; } std::cout << "About to initate nps mode reset..." << std::endl; ret = rsmi_dev_nps_mode_reset(dv_ind); CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "Done resetting nps mode." << std::endl; std::string myNpsMode = originalNpsMode; if (myNpsMode.empty() == false) { std::cout << "Resetting compute partition to " << originalNpsMode << "... " << std::endl; rsmi_nps_mode_type_t origNpsModeType = mapStringToRSMINpsModeTypes[originalNpsMode]; ret = rsmi_dev_nps_mode_set(dv_ind, origNpsModeType); CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "Done" << std::endl; } return RSMI_STATUS_SUCCESS; } int main() { rsmi_status_t ret; ret = rsmi_init(0); CHK_RSMI_RET_I(ret) std::vector val_vec; uint64_t val_ui64, val2_ui64; int64_t val_i64; uint32_t val_ui32; uint16_t val_ui16; rsmi_dev_perf_level_t pfl; rsmi_frequencies_t f; uint32_t num_monitor_devs = 0; rsmi_gpu_metrics_t p; rsmi_num_monitor_devices(&num_monitor_devs); for (uint32_t i = 0; i < num_monitor_devs; ++i) { ret = rsmi_dev_id_get(i, &val_ui16); CHK_RSMI_RET_I(ret) std::cout << "\t**Device ID: 0x" << std::hex << val_ui16 << std::endl; char current_compute_partition[256]; current_compute_partition[0] = '\0'; ret = rsmi_dev_compute_partition_get(i, current_compute_partition, 256); std::cout << "\t**Current Compute Partition: " << (((current_compute_partition == nullptr) || ((current_compute_partition != nullptr) && (current_compute_partition[0] == '\0'))) ? "UNKNOWN" : current_compute_partition); if (ret != RSMI_STATUS_SUCCESS) { std::cout << ", RSMI_STATUS = "; } else { std::cout << std::endl; } CHK_RSMI_NOT_SUPPORTED_OR_UNEXPECTED_DATA_RET(ret) uint32_t len = 5; char nps_mode[len]; nps_mode[0] = '\0'; ret = rsmi_dev_nps_mode_get(i, nps_mode, len); std::cout << "\t**NPS Mode: " << (((nps_mode == nullptr) || ((nps_mode != nullptr) && (nps_mode[0] == '\0'))) ? "UNKNOWN" : nps_mode); if (ret != RSMI_STATUS_SUCCESS) { std::cout << ", RSMI_STATUS = "; } else { std::cout << std::endl; } CHK_NOT_SUPPORTED_OR_UNEXPECTED_DATA_OR_INSUFFICIENT_SIZE_RET(ret) ret = rsmi_dev_gpu_metrics_info_get(i, &p); CHK_AND_PRINT_RSMI_ERR_RET(ret) std::cout << "\t**GPU METRICS" << std::endl; ret = rsmi_dev_perf_level_get(i, &pfl); CHK_AND_PRINT_RSMI_ERR_RET(ret) std::cout << "\t**Performance Level:" << perf_level_string(pfl) << std::endl; ret = rsmi_dev_overdrive_level_get(i, &val_ui32); CHK_AND_PRINT_RSMI_ERR_RET(ret) std::cout << "\t**OverDrive Level:" << val_ui32 << std::endl; ret = rsmi_dev_gpu_clk_freq_get(i, RSMI_CLK_TYPE_MEM, &f); CHK_AND_PRINT_RSMI_ERR_RET(ret) std::cout << "\t**Supported GPU Memory clock frequencies: "; std::cout << f.num_supported << std::endl; print_frequencies(&f); ret = rsmi_dev_gpu_clk_freq_get(i, RSMI_CLK_TYPE_SYS, &f); CHK_AND_PRINT_RSMI_ERR_RET(ret) std::cout << "\t**Supported GPU clock frequencies: "; std::cout << f.num_supported << std::endl; print_frequencies(&f); std::cout << "\t**Monitor name: "; char name[128]; ret = rsmi_dev_name_get(i, name, 128); CHK_AND_PRINT_RSMI_ERR_RET(ret) std::cout << name << std::endl; std::cout << "\t**Temperature: "; ret = rsmi_dev_temp_metric_get(i, 0, RSMI_TEMP_CURRENT, &val_i64); if (ret == RSMI_STATUS_SUCCESS) { std::cout << val_i64/1000 << "C" << std::endl; } CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "\t**Voltage: "; ret = rsmi_dev_volt_metric_get(i, RSMI_VOLT_TYPE_VDDGFX, RSMI_VOLT_CURRENT, &val_i64); if (ret == RSMI_STATUS_SUCCESS) { std::cout << val_i64 << "mV" << std::endl; } CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "\t**Current Fan Speed: "; ret = rsmi_dev_fan_speed_get(i, 0, &val_i64); if (ret == RSMI_STATUS_SUCCESS) { ret = rsmi_dev_fan_speed_max_get(i, 0, &val_ui64); CHK_AND_PRINT_RSMI_ERR_RET(ret) std::cout << (static_cast(val_i64)/val_ui64) * 100; std::cout << "% (" << std::dec << val_i64 << "/" << std::dec << val_ui64 << ")" << std::endl; } CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "\t**Current fan RPMs: "; ret = rsmi_dev_fan_rpms_get(i, 0, &val_i64); if (ret == RSMI_STATUS_SUCCESS) { std::cout << std::dec << val_i64 << std::endl; } CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "\t**Current Power Cap: "; ret = rsmi_dev_power_cap_get(i, 0, &val_ui64); if (ret == RSMI_STATUS_SUCCESS) { std::cout << std::dec << val_ui64 << "uW" <(val_ui64)/1000 << " W" << std::endl; } CHK_RSMI_NOT_SUPPORTED_RET(ret) std::cout << "\t=======" << std::endl; } std::cout << "***** Testing write api's" << std::endl; if (isUserRunningAsSudo() == false) { std::cout << "Write APIs require users to execute with sudo. " << "Cannot proceed." << std::endl; return 0; } for (uint32_t i = 0; i< num_monitor_devs; ++i) { ret = test_set_overdrive(i); CHK_AND_PRINT_RSMI_ERR_RET(ret) ret = test_set_perf_level(i); CHK_AND_PRINT_RSMI_ERR_RET(ret) ret = test_set_fan_speed(i); CHK_AND_PRINT_RSMI_ERR_RET(ret) ret = test_power_cap(i); CHK_AND_PRINT_RSMI_ERR_RET(ret) ret = test_power_profile(i); CHK_AND_PRINT_RSMI_ERR_RET(ret) ret = test_set_compute_partitioning(i); CHK_AND_PRINT_RSMI_ERR_RET(ret) ret = test_set_freq(i); CHK_AND_PRINT_RSMI_ERR_RET(ret) ret = test_set_nps_mode(i); CHK_AND_PRINT_RSMI_ERR_RET(ret) } return 0; }