Files
rocm-systems/tests/python_unittest/unit_tests.py
T
Castillo, Juan 34f465bfc5 [SWDEV-531904] Removed Handle Exceptions function (#531)
Removed:
- handle_exceptions(): exposed, silenced, and logged AMDSMI exceptions to users, and returned success/failure

Signed-off-by: Juan Castillo <juan.castillo@amd.com>
2025-07-07 13:26:26 -05:00

4051 wiersze
155 KiB
Python
Executable File

#!/usr/bin/env python3
#
# Copyright (c) Advanced Micro Devices, Inc. All rights reserved.
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
# THE SOFTWARE.
import inspect
import json
import sys
import unittest
sys.path.append("/opt/rocm/libexec/amdsmi_cli/")
try:
import amdsmi
except ImportError:
raise ImportError("Could not import /opt/rocm/libexec/amdsmi_cli/amdsmi_cli.py")
# Status codes (as decimal strings) that mean "this API is not available
# here"; _check_ret reports these as skipped rather than failed.
not_supported_error_codes = ['2', '3', '49']
# Symbolic names of the codes listed above.
not_supported_error_code_names = [
    'AMDSMI_STATUS_NOT_SUPPORTED',
    'AMDSMI_STATUS_NOT_YET_IMPLEMENTED',
    'AMDSMI_STATUS_NO_HSMP_MSG_SUP',
]
# Maps a status code, spelled as a string, to its symbolic name.
# Lookups in this file are made with str(code), which yields a decimal string.
error_map = {
    '0': 'AMDSMI_STATUS_SUCCESS',
    '1': 'AMDSMI_STATUS_INVAL',
    '2': 'AMDSMI_STATUS_NOT_SUPPORTED',
    '3': 'AMDSMI_STATUS_NOT_YET_IMPLEMENTED',
    '4': 'AMDSMI_STATUS_FAIL_LOAD_MODULE',
    '5': 'AMDSMI_STATUS_FAIL_LOAD_SYMBOL',
    '6': 'AMDSMI_STATUS_DRM_ERROR',
    '7': 'AMDSMI_STATUS_API_FAILED',
    '8': 'AMDSMI_STATUS_TIMEOUT',
    '9': 'AMDSMI_STATUS_RETRY',
    '10': 'AMDSMI_STATUS_NO_PERM',
    '11': 'AMDSMI_STATUS_INTERRUPT',
    '12': 'AMDSMI_STATUS_IO',
    '13': 'AMDSMI_STATUS_ADDRESS_FAULT',
    '14': 'AMDSMI_STATUS_FILE_ERROR',
    '15': 'AMDSMI_STATUS_OUT_OF_RESOURCES',
    '16': 'AMDSMI_STATUS_INTERNAL_EXCEPTION',
    '17': 'AMDSMI_STATUS_INPUT_OUT_OF_BOUNDS',
    '18': 'AMDSMI_STATUS_INIT_ERROR',
    '19': 'AMDSMI_STATUS_REFCOUNT_OVERFLOW',
    '30': 'AMDSMI_STATUS_BUSY',
    '31': 'AMDSMI_STATUS_NOT_FOUND',
    '32': 'AMDSMI_STATUS_NOT_INIT',
    '33': 'AMDSMI_STATUS_NO_SLOT',
    '34': 'AMDSMI_STATUS_DRIVER_NOT_LOADED',
    '39': 'AMDSMI_STATUS_MORE_DATA',
    '40': 'AMDSMI_STATUS_NO_DATA',
    '41': 'AMDSMI_STATUS_INSUFFICIENT_SIZE',
    '42': 'AMDSMI_STATUS_UNEXPECTED_SIZE',
    '43': 'AMDSMI_STATUS_UNEXPECTED_DATA',
    '44': 'AMDSMI_STATUS_NON_AMD_CPU',
    '45': 'AMDSMI_STATUS_NO_ENERGY_DRV',
    '46': 'AMDSMI_STATUS_NO_MSR_DRV',
    '47': 'AMDSMI_STATUS_NO_HSMP_DRV',
    '48': 'AMDSMI_STATUS_NO_HSMP_SUP',
    '49': 'AMDSMI_STATUS_NO_HSMP_MSG_SUP',
    '50': 'AMDSMI_STATUS_HSMP_TIMEOUT',
    '51': 'AMDSMI_STATUS_NO_DRV',
    '52': 'AMDSMI_STATUS_FILE_NOT_FOUND',
    '53': 'AMDSMI_STATUS_ARG_PTR_NULL',
    '54': 'AMDSMI_STATUS_AMDGPU_RESTART_ERR',
    '55': 'AMDSMI_STATUS_SETTING_UNAVAILABLE',
    '56': 'AMDSMI_STATUS_CORRUPTED_EEPROM',
    # Hex-spelled keys are kept so any existing lookup by these literals
    # keeps working.
    '0xFFFFFFFE': 'AMDSMI_STATUS_MAP_ERROR',
    '0xFFFFFFFF': 'AMDSMI_STATUS_UNKNOWN_ERROR',
    # Decimal spellings of the same two codes: str() of an integer code never
    # produces the hex form, so without these entries the lookup would fail.
    str(0xFFFFFFFE): 'AMDSMI_STATUS_MAP_ERROR',
    str(0xFFFFFFFF): 'AMDSMI_STATUS_UNKNOWN_ERROR',
}
class TestAmdSmiPythonBDF(unittest.TestCase):
    # Well-formed BDF strings mapped to the four-integer list the parser is
    # expected to return (presumably [domain, bus, device, function]; the
    # short form without a leading 4-digit field maps to a first element of 0).
    valid_bdfs = {
        "00:00.0": [0, 0, 0, 0],
        "01:01.1": [0, 1, 1, 1],
        "FF:1F.7": [0, 255, 31, 7],
        "FF:00.7": [0, 255, 0, 7],
        "11:01.2": [0, 17, 1, 2],
        "11:0a.2": [0, 17, 10, 2],
        "0000:FF:1F.7": [0, 255, 31, 7],
        "0001:ff:1F.7": [1, 255, 31, 7],
        "ffff:FF:1f.7": [65535, 255, 31, 7],
    }
    # Malformed BDF inputs; every one of them is expected to parse to None.
    invalid_bdfs = dict.fromkeys(
        (
            None,
            "",
            "00:00:0",
            "00.00:0",
            "00:00.Z",
            "00:0Z.0",
            "0Z:00.0",
            "Z00:00.0",
            "A00:00.0",
            "0A00:00.0",
            "00:00.07",
            "00:00.8",
            "00:00.10",
            "00:00.11",
            "00:00.-1",
            "00:00.*-1",
            "00:00.123",
            "00:20.0",
            "00:45.0",
            "00:200.0",
            "00:002.0",
            "100:00.0",
            "0100:00.0",
            "00100:00.0",
            "0101:00.0",
            "00001:00.0",
            "10001:00.0",
            "45:0.0",
            ".00:00.0",
            "00.00.0",
            "00.0.0",
            "0.00.0",
            "000.00.0",
            "00 00 0",
            " 00:00.0",
            "00:00.0 ",
            "0000:00.00.0",
            "000:00:00.0",
            "00:00:00.1",
            "0:00:00.1",
            "0000 00 00 0",
            "-1-1:00:00.0",
            "AAAA:00:AA.0",
            "*1*1:00:00.0",
            "0000:00:00.07",
            "0000:00:00.8",
            "0000:00:00.10",
            "0000:00:00.11",
            "0000:00:00.-1",
            "0000:00:00.*-1",
            "0000:00:00.123",
            "0000:00:20.0",
            "0000:00:45.0",
            "0000:00:200.0",
            "0000:00:002.0",
            "0000:100:00.0",
            "0000:0100:00.0",
            "0000:00100:00.0",
            "0000:0101:00.0",
            "0000:00001:00.0",
            "0000:10001:00.0",
            "0000:45:0.0",
            ".0000.00:00.0",
            "0000.00.0.0",
            " 0000:00:00.0",
            "0000:00:00.0 ",
        ),
        None,
    )
    # Status names used as the "expected result" column of the tables below.
    PASS = 'AMDSMI_STATUS_SUCCESS'
    FAIL = 'AMDSMI_STATUS_INVAL'
    # Tests guarded by any of these flags are skipped for now and still need
    # to be implemented or fixed later.
    TODO_SKIP_NYI = True
    TODO_SKIP_FAIL = True
    TODO_SKIP_NOT_COMPLETE = True
# Parameter tables for the tests. Every entry is a
# (label, amdsmi constant, expected status name) tuple; the third element is
# the value handed to _check_ret as the expected code.
clk_types = [
    ('SYS', amdsmi.AmdSmiClkType.SYS, PASS),
    ('GFX', amdsmi.AmdSmiClkType.GFX, PASS),
    ('DF', amdsmi.AmdSmiClkType.DF, PASS),
    ('DCEF', amdsmi.AmdSmiClkType.DCEF, PASS),
    ('SOC', amdsmi.AmdSmiClkType.SOC, PASS),
    ('MEM', amdsmi.AmdSmiClkType.MEM, PASS),
    ('PCIE', amdsmi.AmdSmiClkType.PCIE, PASS),
    ('VCLK0', amdsmi.AmdSmiClkType.VCLK0, PASS),
    ('VCLK1', amdsmi.AmdSmiClkType.VCLK1, PASS),
    ('DCLK0', amdsmi.AmdSmiClkType.DCLK0, PASS),
    ('DCLK1', amdsmi.AmdSmiClkType.DCLK1, PASS),
]
# Clock limit selectors.
clk_limit_types = [
    ('MIN', amdsmi.AmdSmiClkLimitType.MIN, PASS),
    ('MAX', amdsmi.AmdSmiClkLimitType.MAX, PASS),
]
# IO bandwidth encodings taken from the low-level wrapper module.
io_bw_encodings = [
    ('AGG_BW0', amdsmi.amdsmi_wrapper.AGG_BW0, PASS),
    ('RD_BW0', amdsmi.amdsmi_wrapper.RD_BW0, PASS),
    ('WR_BW0', amdsmi.amdsmi_wrapper.WR_BW0, PASS),
]
# Event groups; GRP_INVALID is expected to be rejected.
event_groups = [
    ('XGMI', amdsmi.AmdSmiEventGroup.XGMI, PASS),
    ('XGMI_DATA_OUT', amdsmi.AmdSmiEventGroup.XGMI_DATA_OUT, PASS),
    ('GRP_INVALID', amdsmi.AmdSmiEventGroup.GRP_INVALID, FAIL),
]
# GPU blocks; INVALID and RESERVED are expected to be rejected.
gpu_blocks = [
    ('INVALID', amdsmi.AmdSmiGpuBlock.INVALID, FAIL),
    ('UMC', amdsmi.AmdSmiGpuBlock.UMC, PASS),
    ('SDMA', amdsmi.AmdSmiGpuBlock.SDMA, PASS),
    ('GFX', amdsmi.AmdSmiGpuBlock.GFX, PASS),
    ('MMHUB', amdsmi.AmdSmiGpuBlock.MMHUB, PASS),
    ('ATHUB', amdsmi.AmdSmiGpuBlock.ATHUB, PASS),
    ('PCIE_BIF', amdsmi.AmdSmiGpuBlock.PCIE_BIF, PASS),
    ('HDP', amdsmi.AmdSmiGpuBlock.HDP, PASS),
    ('XGMI_WAFL', amdsmi.AmdSmiGpuBlock.XGMI_WAFL, PASS),
    ('DF', amdsmi.AmdSmiGpuBlock.DF, PASS),
    ('SMN', amdsmi.AmdSmiGpuBlock.SMN, PASS),
    ('SEM', amdsmi.AmdSmiGpuBlock.SEM, PASS),
    ('MP0', amdsmi.AmdSmiGpuBlock.MP0, PASS),
    ('MP1', amdsmi.AmdSmiGpuBlock.MP1, PASS),
    ('FUSE', amdsmi.AmdSmiGpuBlock.FUSE, PASS),
    ('MCA', amdsmi.AmdSmiGpuBlock.MCA, PASS),
    ('VCN', amdsmi.AmdSmiGpuBlock.VCN, PASS),
    ('JPEG', amdsmi.AmdSmiGpuBlock.JPEG, PASS),
    ('IH', amdsmi.AmdSmiGpuBlock.IH, PASS),
    ('MPIO', amdsmi.AmdSmiGpuBlock.MPIO, PASS),
    ('RESERVED', amdsmi.AmdSmiGpuBlock.RESERVED, FAIL),
]
# Memory pools.
memory_types = [
    ('VRAM', amdsmi.AmdSmiMemoryType.VRAM, PASS),
    ('VIS_VRAM', amdsmi.AmdSmiMemoryType.VIS_VRAM, PASS),
    ('GTT', amdsmi.AmdSmiMemoryType.GTT, PASS),
]
# Register spaces.
reg_types = [
    ('XGMI', amdsmi.AmdSmiRegType.XGMI, PASS),
    ('WAFL', amdsmi.AmdSmiRegType.WAFL, PASS),
    ('PCIE', amdsmi.AmdSmiRegType.PCIE, PASS),
    ('USR', amdsmi.AmdSmiRegType.USR, PASS),
    ('USR1', amdsmi.AmdSmiRegType.USR1, PASS),
]
# Voltage metrics.
voltage_metrics = [
    ('CURRENT', amdsmi.AmdSmiVoltageMetric.CURRENT, PASS),
    ('MAX', amdsmi.AmdSmiVoltageMetric.MAX, PASS),
    ('MIN_CRIT', amdsmi.AmdSmiVoltageMetric.MIN_CRIT, PASS),
    ('MIN', amdsmi.AmdSmiVoltageMetric.MIN, PASS),
    ('MAX_CRIT', amdsmi.AmdSmiVoltageMetric.MAX_CRIT, PASS),
    ('AVERAGE', amdsmi.AmdSmiVoltageMetric.AVERAGE, PASS),
    ('LOWEST', amdsmi.AmdSmiVoltageMetric.LOWEST, PASS),
    ('HIGHEST', amdsmi.AmdSmiVoltageMetric.HIGHEST, PASS),
]
# Voltage sensor types; INVALID is expected to be rejected.
voltage_types = [
    ('VDDGFX', amdsmi.AmdSmiVoltageType.VDDGFX, PASS),
    ('INVALID', amdsmi.AmdSmiVoltageType.INVALID, FAIL),
]
# Link types; NOT_APPLICABLE and UNKNOWN are expected to be rejected.
link_types = [
    ('AMDSMI_LINK_TYPE_INTERNAL', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_INTERNAL, PASS),
    ('AMDSMI_LINK_TYPE_XGMI', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_XGMI, PASS),
    ('AMDSMI_LINK_TYPE_PCIE', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_PCIE, PASS),
    ('AMDSMI_LINK_TYPE_NOT_APPLICABLE', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_NOT_APPLICABLE, FAIL),
    ('AMDSMI_LINK_TYPE_UNKNOWN', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_UNKNOWN, FAIL),
]
# Temperature sensor locations.
temperature_types = [
    ('EDGE', amdsmi.AmdSmiTemperatureType.EDGE, PASS),
    ('HOTSPOT', amdsmi.AmdSmiTemperatureType.HOTSPOT, PASS),
    ('JUNCTION', amdsmi.AmdSmiTemperatureType.JUNCTION, PASS),
    ('VRAM', amdsmi.AmdSmiTemperatureType.VRAM, PASS),
    ('HBM_0', amdsmi.AmdSmiTemperatureType.HBM_0, PASS),
    ('HBM_1', amdsmi.AmdSmiTemperatureType.HBM_1, PASS),
    ('HBM_2', amdsmi.AmdSmiTemperatureType.HBM_2, PASS),
    ('HBM_3', amdsmi.AmdSmiTemperatureType.HBM_3, PASS),
    ('PLX', amdsmi.AmdSmiTemperatureType.PLX, PASS),
]
# Temperature metrics.
temperature_metrics = [
    ('CURRENT', amdsmi.AmdSmiTemperatureMetric.CURRENT, PASS),
    ('MAX', amdsmi.AmdSmiTemperatureMetric.MAX, PASS),
    ('MIN', amdsmi.AmdSmiTemperatureMetric.MIN, PASS),
    ('MAX_HYST', amdsmi.AmdSmiTemperatureMetric.MAX_HYST, PASS),
    ('MIN_HYST', amdsmi.AmdSmiTemperatureMetric.MIN_HYST, PASS),
    ('CRITICAL', amdsmi.AmdSmiTemperatureMetric.CRITICAL, PASS),
    ('CRITICAL_HYST', amdsmi.AmdSmiTemperatureMetric.CRITICAL_HYST, PASS),
    ('EMERGENCY', amdsmi.AmdSmiTemperatureMetric.EMERGENCY, PASS),
    ('EMERGENCY_HYST', amdsmi.AmdSmiTemperatureMetric.EMERGENCY_HYST, PASS),
    ('CRIT_MIN', amdsmi.AmdSmiTemperatureMetric.CRIT_MIN, PASS),
    ('CRIT_MIN_HYST', amdsmi.AmdSmiTemperatureMetric.CRIT_MIN_HYST, PASS),
    ('OFFSET', amdsmi.AmdSmiTemperatureMetric.OFFSET, PASS),
    ('LOWEST', amdsmi.AmdSmiTemperatureMetric.LOWEST, PASS),
    ('HIGHEST', amdsmi.AmdSmiTemperatureMetric.HIGHEST, PASS),
]
# Utilization counter kinds.
utilization_counter_types = [
    ('COARSE_GRAIN_GFX_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.COARSE_GRAIN_GFX_ACTIVITY, PASS),
    ('COARSE_GRAIN_MEM_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.COARSE_GRAIN_MEM_ACTIVITY, PASS),
    ('COARSE_DECODER_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.COARSE_DECODER_ACTIVITY, PASS),
    ('FINE_GRAIN_GFX_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.FINE_GRAIN_GFX_ACTIVITY, PASS),
    ('FINE_GRAIN_MEM_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.FINE_GRAIN_MEM_ACTIVITY, PASS),
    ('FINE_DECODER_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.FINE_DECODER_ACTIVITY, PASS),
    ('UTILIZATION_COUNTER_FIRST', amdsmi.AmdSmiUtilizationCounterType.UTILIZATION_COUNTER_FIRST, PASS),
    ('UTILIZATION_COUNTER_LAST', amdsmi.AmdSmiUtilizationCounterType.UTILIZATION_COUNTER_LAST, PASS),
]
# Performance-counter event types.
event_types = [
    ('XGMI_0_NOP_TX', amdsmi.AmdSmiEventType.XGMI_0_NOP_TX, PASS),
    ('XGMI_0_REQUEST_TX', amdsmi.AmdSmiEventType.XGMI_0_REQUEST_TX, PASS),
    ('XGMI_0_RESPONSE_TX', amdsmi.AmdSmiEventType.XGMI_0_RESPONSE_TX, PASS),
    ('XGMI_0_BEATS_TX', amdsmi.AmdSmiEventType.XGMI_0_BEATS_TX, PASS),
    ('XGMI_1_NOP_TX', amdsmi.AmdSmiEventType.XGMI_1_NOP_TX, PASS),
    ('XGMI_1_REQUEST_TX', amdsmi.AmdSmiEventType.XGMI_1_REQUEST_TX, PASS),
    ('XGMI_1_RESPONSE_TX', amdsmi.AmdSmiEventType.XGMI_1_RESPONSE_TX, PASS),
    ('XGMI_1_BEATS_TX', amdsmi.AmdSmiEventType.XGMI_1_BEATS_TX, PASS),
    ('XGMI_DATA_OUT_0', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_0, PASS),
    ('XGMI_DATA_OUT_1', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_1, PASS),
    ('XGMI_DATA_OUT_2', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_2, PASS),
    ('XGMI_DATA_OUT_3', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_3, PASS),
    ('XGMI_DATA_OUT_4', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_4, PASS),
    ('XGMI_DATA_OUT_5', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_5, PASS),
]
# Counter control commands.
counter_commands = [
    ('CMD_START', amdsmi.AmdSmiCounterCommand.CMD_START, PASS),
    ('CMD_STOP', amdsmi.AmdSmiCounterCommand.CMD_STOP, PASS),
]
# Compute partition modes; INVALID is expected to be rejected.
compute_partition_types = [
    ('SPX', amdsmi.AmdSmiComputePartitionType.SPX, PASS),
    ('DPX', amdsmi.AmdSmiComputePartitionType.DPX, PASS),
    ('TPX', amdsmi.AmdSmiComputePartitionType.TPX, PASS),
    ('QPX', amdsmi.AmdSmiComputePartitionType.QPX, PASS),
    ('CPX', amdsmi.AmdSmiComputePartitionType.CPX, PASS),
    ('INVALID', amdsmi.AmdSmiComputePartitionType.INVALID, FAIL),
]
# Memory partition modes; UNKNOWN is expected to be rejected.
memory_partition_types = [
    ('NPS1', amdsmi.AmdSmiMemoryPartitionType.NPS1, PASS),
    ('NPS2', amdsmi.AmdSmiMemoryPartitionType.NPS2, PASS),
    ('NPS4', amdsmi.AmdSmiMemoryPartitionType.NPS4, PASS),
    ('NPS8', amdsmi.AmdSmiMemoryPartitionType.NPS8, PASS),
    ('UNKNOWN', amdsmi.AmdSmiMemoryPartitionType.UNKNOWN, FAIL),
]
# Frequency index selectors; INVALID is expected to be rejected.
freq_inds = [
    ('MIN', amdsmi.AmdSmiFreqInd.MIN, PASS),
    ('MAX', amdsmi.AmdSmiFreqInd.MAX, PASS),
    ('INVALID', amdsmi.AmdSmiFreqInd.INVALID, FAIL),
]
# Device performance levels; UNKNOWN is expected to be rejected.
dev_perf_levels = [
    ('AUTO', amdsmi.AmdSmiDevPerfLevel.AUTO, PASS),
    ('LOW', amdsmi.AmdSmiDevPerfLevel.LOW, PASS),
    ('HIGH', amdsmi.AmdSmiDevPerfLevel.HIGH, PASS),
    ('MANUAL', amdsmi.AmdSmiDevPerfLevel.MANUAL, PASS),
    ('STABLE_STD', amdsmi.AmdSmiDevPerfLevel.STABLE_STD, PASS),
    ('STABLE_PEAK', amdsmi.AmdSmiDevPerfLevel.STABLE_PEAK, PASS),
    ('STABLE_MIN_MCLK', amdsmi.AmdSmiDevPerfLevel.STABLE_MIN_MCLK, PASS),
    ('STABLE_MIN_SCLK', amdsmi.AmdSmiDevPerfLevel.STABLE_MIN_SCLK, PASS),
    ('DETERMINISM', amdsmi.AmdSmiDevPerfLevel.DETERMINISM, PASS),
    ('UNKNOWN', amdsmi.AmdSmiDevPerfLevel.UNKNOWN, FAIL),
]
# Power profile preset masks; INVALID is expected to be rejected.
power_profile_preset_masks = [
    ('CUSTOM_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.CUSTOM_MASK, PASS),
    ('VIDEO_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.VIDEO_MASK, PASS),
    ('POWER_SAVING_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.POWER_SAVING_MASK, PASS),
    ('COMPUTE_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.COMPUTE_MASK, PASS),
    ('VR_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.VR_MASK, PASS),
    ('THREE_D_FULL_SCR_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.THREE_D_FULL_SCR_MASK, PASS),
    ('BOOTUP_DEFAULT', amdsmi.AmdSmiPowerProfilePresetMasks.BOOTUP_DEFAULT, PASS),
    ('INVALID', amdsmi.AmdSmiPowerProfilePresetMasks.INVALID, FAIL),
]
def test_parse_bdf(self):
    # Feed every valid and invalid BDF fixture to _parse_bdf and compare the
    # parsed value with the expected one (None for the invalid inputs).
    cases = {**self.valid_bdfs, **self.invalid_bdfs}
    for bdf, expected in cases.items():
        result = amdsmi.amdsmi_interface._parse_bdf(bdf)
        self.assertEqual(
            result,
            expected,
            f"Expected {expected} for bdf {bdf}, but got {result}",
        )
@classmethod
def _convert_bdf_to_long(clz, bdf):
if len(bdf) == 12:
return bdf
if len(bdf) == 7:
return "0000:" + bdf
return None
def test_format_bdf(self):
    # Round-trip check over the valid fixtures: the fixture value (integer
    # list) is the input and the fixture key, expanded to the long form and
    # lower-cased, is the expected formatted string.
    for bdf_string, bdf_list in self.valid_bdfs.copy().items():
        smi_bdf = amdsmi.amdsmi_interface._make_amdsmi_bdf_from_list(bdf_list)
        expected = TestAmdSmiPythonBDF._convert_bdf_to_long(bdf_string).lower()
        result = amdsmi.amdsmi_interface._format_bdf(smi_bdf)
        self.assertEqual(
            result,
            expected,
            f"Expected {expected} for bdf {bdf_string}, but got {result}",
        )
def test_check_res(self):
    # _check_res must translate status codes into exceptions:
    # RETRY -> AmdSmiRetryException, INVAL -> AmdSmiLibraryException,
    # SUCCESS -> no exception and a None result.
    iface = amdsmi.amdsmi_interface
    status = iface.amdsmi_wrapper

    # a retry status must raise AmdSmiRetryException ...
    with self.assertRaises(amdsmi.AmdSmiRetryException) as retry_test:
        iface._check_res(status.AMDSMI_STATUS_RETRY)
    # ... and the exception must carry the AMDSMI_STATUS_RETRY code
    self.assertEqual(retry_test.exception.get_error_code(),
                     status.AMDSMI_STATUS_RETRY)

    # an invalid-argument status must raise AmdSmiLibraryException ...
    with self.assertRaises(amdsmi.AmdSmiLibraryException) as inval_test:
        iface._check_res(status.AMDSMI_STATUS_INVAL)
    # ... and the exception must carry the AMDSMI_STATUS_INVAL code
    self.assertEqual(inval_test.exception.get_error_code(),
                     status.AMDSMI_STATUS_INVAL)

    # a successful status raises nothing and yields None
    result = iface._check_res(status.AMDSMI_STATUS_SUCCESS)
    self.assertEqual(None, result)
@classmethod
def _print(self, msg, data=None, cond=None):
    """Print msg and, when present, data; active only when verbose == 2.

    Falsy data prints just msg. Data that is one of the not-supported status
    names is appended to msg on the same line. Anything else is dumped as
    indented JSON after msg; when data is a known status name the JSON
    follows msg on the same line. cond is accepted but not used.
    """
    if verbose != 2:
        return
    if not data:
        print(msg, flush=True)
        return
    if data in not_supported_error_code_names:
        print(f'{msg}{data}', flush=True)
        return
    is_status_name = isinstance(data, str) and data in error_map.values()
    if is_status_name:
        # keep the status name on the same line as the message
        print(msg, end='')
    else:
        print(msg)
    print(json.dumps(data, sort_keys=False, indent=4), flush=True)
@classmethod
def _print_func_name(self, msg):
    """Print msg and the name of the function two frames up the stack.

    Active only when verbose == 2. Nothing is printed when that frame is
    '_callSetUp'. The frame index is fixed, so this must be invoked directly
    from the method whose caller is to be reported.
    """
    if verbose != 2:
        return
    caller = inspect.stack()[2].function
    if caller == '_callSetUp':
        return
    print(msg, flush=True)
    print(f'{caller}', flush=True)
@classmethod
def get_error_code(self, e):
    """Return the symbolic status name for the error code carried by e.

    Args:
        e: an exception object exposing get_error_code().

    Returns:
        The name stored in error_map for that code.

    Raises:
        KeyError: if the code has no entry in error_map.
    """
    # error_map is keyed by strings, so the code must be stringified before
    # the lookup (the same conversion _check_ret performs).
    return error_map[str(e.get_error_code())]
@classmethod
def _check_ret(self, msg, _e, expected_code=None):
    """Classify a library exception and report whether it is a test failure.

    Args:
        msg: prefix printed in front of the verdict when verbose == 2.
        _e: exception object exposing get_error_code().
        expected_code: status name the caller expects, or None.

    Returns:
        False when the code is one of the not-supported codes (skipped) or
        its name equals expected_code (passed); True otherwise (failed).
    """
    error_code = str(_e.get_error_code())
    # A code missing from error_map must not raise KeyError here: this runs
    # inside the caller's except handler and would hide the real library
    # error. An unmapped code gets a placeholder name and counts as a failure.
    error_code_name = error_map.get(error_code, f'UNMAPPED_STATUS_CODE_{error_code}')
    if error_code in not_supported_error_codes:
        if verbose == 2:
            print(f'{msg}\nTest SKIPPED with result {error_code_name}', flush=True)
        return False
    if error_code_name == expected_code:
        if verbose == 2:
            print(f'{msg}\nTest PASSED with expected result {expected_code}', flush=True)
        return False
    if verbose == 2:
        print(f'{msg}\nTest FAILED with expected result {expected_code} but received {error_code_name}', flush=True)
    return True
def setUp(self):
    """Report the calling function (verbose mode only) and initialise amdsmi.

    _print_func_name looks a fixed number of frames up the stack, so it has
    to be called directly from here.
    """
    self._print_func_name(msg='')
    amdsmi.amdsmi_init()
def tearDown(self):
    """Shut the amdsmi library down after a test."""
    amdsmi.amdsmi_shut_down()
def test_clean_gpu_local_data(self):
    # Call amdsmi_clean_gpu_local_data on every processor handle. Library
    # errors are classified by _check_ret; the last one flagged as a failure
    # is re-raised after all handles have been visited.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f"gpu({idx}): "
        try:
            outcome = amdsmi.amdsmi_clean_gpu_local_data(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_cpu_apb_disable(self):
    # Call amdsmi_cpu_apb_disable (second argument 0) on every processor
    # handle; the last error _check_ret flags as a failure is re-raised
    # once the loop is done.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f"gpu({idx}): "
        try:
            outcome = amdsmi.amdsmi_cpu_apb_disable(handle, 0)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_cpu_apb_enable(self):
    # Call amdsmi_cpu_apb_enable on every processor handle; the last error
    # _check_ret flags as a failure is re-raised once the loop is done.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f"gpu({idx}): "
        try:
            outcome = amdsmi.amdsmi_cpu_apb_enable(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_first_online_core_on_cpu_socket(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_first_online_core_on_cpu_socket on every processor handle and
    # re-raises the last error _check_ret flags as a failure.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_first_online_core_on_cpu_socket as it fails.")
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f"gpu({idx}): "
        try:
            outcome = amdsmi.amdsmi_first_online_core_on_cpu_socket(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_free_name_value_pairs(self):
    # Skipped while TODO_SKIP_NYI is set. Otherwise calls
    # amdsmi_free_name_value_pairs(None) once and re-raises the library
    # error if _check_ret flags it as a failure.
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_free_name_value_pairs as it is not implemented yet.")
    raise_exception = None
    self.setUp()
    try:
        msg = ""
        # The result used to be bound to `rc` while `ret` was printed, which
        # raised NameError as soon as the call succeeded.
        ret = amdsmi.amdsmi_free_name_value_pairs(None)
        self._print(msg, ret)
    except amdsmi.AmdSmiLibraryException as e:
        if self._check_ret(msg, e, self.PASS):
            raise_exception = e
    if raise_exception:
        raise raise_exception
    self.tearDown()
def test_get_clk_freq(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_clk_freq for every (processor handle, clock type) pair and
    # re-raises the last error _check_ret flags as a failure.
    if self.TODO_SKIP_FAIL:
        # The message previously named test_get_clock_info (copy-paste slip).
        self.skipTest("Skipping test_get_clk_freq as it fails.")
    raise_exception = None
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    for i in range(0, len(processors)):
        for clk_type_name, clk_type, clk_cond in self.clk_types:
            try:
                msg = f"gpu({i}): Clock Type({clk_type_name}): "
                ret = amdsmi.amdsmi_get_clk_freq(processors[i], clk_type)
                self._print(msg, ret)
            except amdsmi.AmdSmiLibraryException as e:
                if self._check_ret(msg, e, clk_cond):
                    raise_exception = e
    if raise_exception:
        raise raise_exception
    self.tearDown()
def test_get_clock_info(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_clock_info for every (processor handle, clock type) pair
    # and re-raises the last error _check_ret flags as a failure.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_clock_info as it fails.")
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        for clk_label, clk_value, clk_expected in self.clk_types:
            label = f'gpu({idx}): Clock Type({clk_label}): '
            try:
                outcome = amdsmi.amdsmi_get_clock_info(handle, clk_value)
                self._print(label, outcome)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, clk_expected):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_cclk_limit(self):
    # Call amdsmi_get_cpu_cclk_limit on every processor handle; the last
    # error _check_ret flags as a failure is re-raised after the loop.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_cclk_limit(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_core_boostlimit(self):
    # Call amdsmi_get_cpu_core_boostlimit on every processor handle. Here
    # tearDown runs before the last flagged error is re-raised.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_core_boostlimit(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    self.tearDown()
    if failure:
        raise failure
def test_get_cpu_core_current_freq_limit(self):
    # Call amdsmi_get_cpu_core_current_freq_limit on every processor handle;
    # the last error _check_ret flags as a failure is re-raised afterwards.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f"gpu({idx}): "
        try:
            outcome = amdsmi.amdsmi_get_cpu_core_current_freq_limit(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_core_energy(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_cpu_core_energy on every processor handle and re-raises the
    # last error _check_ret flags as a failure.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_core_energy as it fails.")
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f"gpu({idx}): "
        try:
            outcome = amdsmi.amdsmi_get_cpu_core_energy(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_current_io_bandwidth(self):
    # Call amdsmi_get_cpu_current_io_bandwidth for every
    # (processor handle, bandwidth encoding) pair, passing both the encoding
    # value and its label; the last flagged error is re-raised afterwards.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        for enc_label, enc_value, enc_expected in self.io_bw_encodings:
            label = f'gpu({idx}): encodeing({enc_label}): '
            try:
                outcome = amdsmi.amdsmi_get_cpu_current_io_bandwidth(handle, enc_value, enc_label)
                self._print(label, outcome)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, enc_expected):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_ddr_bw(self):
    # Call amdsmi_get_cpu_ddr_bw on every processor handle; the last error
    # _check_ret flags as a failure is re-raised after the loop.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_ddr_bw(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_dimm_power_consumption(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_cpu_dimm_power_consumption on every processor handle with a
    # fixed DIMM address and re-raises the last flagged error.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_dimm_power_consumption as it fails.")
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: the DIMM address is a placeholder value of 0
    address = 0
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_dimm_power_consumption(handle, address)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_dimm_temp_range_and_refresh_rate(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_cpu_dimm_temp_range_and_refresh_rate on every processor
    # handle with a fixed DIMM address and re-raises the last flagged error.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_dimm_temp_range_and_refresh_rate as it fails.")
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: the DIMM address is a placeholder value of 0
    address = 0
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_dimm_temp_range_and_refresh_rate(handle, address)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_dimm_thermal_sensor(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_cpu_dimm_thermal_sensor on every processor handle with a
    # fixed DIMM address and re-raises the last flagged error.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_dimm_thermal_sensor as it fails.")
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: the DIMM address is a placeholder value of 0
    address = 0
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_dimm_thermal_sensor(handle, address)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_family(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_cpu_family once (no handle argument) and re-raises the
    # library error if _check_ret flags it as a failure.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_family as it fails.")
    self.setUp()
    failure = None
    label = ''
    try:
        outcome = amdsmi.amdsmi_get_cpu_family()
        self._print(label, outcome)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_fclk_mclk(self):
    # Call amdsmi_get_cpu_fclk_mclk on every processor handle; the last
    # error _check_ret flags as a failure is re-raised after the loop.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_fclk_mclk(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_handles(self):
    # Skipped while TODO_SKIP_NYI is set. Otherwise calls
    # amdsmi_get_cpu_handles once with AMDSMI_MAX_DEVICES and re-raises the
    # library error if _check_ret flags it as a failure.
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_cpu_handles as it is not implemented yet.")
    self.setUp()
    failure = None
    label = ''
    try:
        outcome = amdsmi.amdsmi_get_cpu_handles(amdsmi.amdsmi_interface.AMDSMI_MAX_DEVICES)
        self._print(label, outcome)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_hsmp_driver_version(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_cpu_hsmp_driver_version on every processor handle and
    # re-raises the last error _check_ret flags as a failure.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_hsmp_driver_version as it fails.")
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_hsmp_driver_version(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_hsmp_proto_ver(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise calls
    # amdsmi_get_cpu_hsmp_proto_ver on every processor handle and re-raises
    # the last error _check_ret flags as a failure.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_hsmp_proto_ver as it fails.")
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_hsmp_proto_ver(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_model(self):
    # Skipped while TODO_SKIP_FAIL is set. Otherwise checks the processor
    # handle count, then calls amdsmi_get_cpu_model once (no handle
    # argument) and re-raises the error if _check_ret flags it as a failure.
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_model as it fails.")
    self.setUp()
    handle_count = len(amdsmi.amdsmi_get_processor_handles())
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    label = ''
    try:
        outcome = amdsmi.amdsmi_get_cpu_model()
        self._print(label, outcome)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_prochot_status(self):
    # Call amdsmi_get_cpu_prochot_status on every processor handle; the last
    # error _check_ret flags as a failure is re-raised after the loop.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_prochot_status(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_pwr_svi_telemetry_all_rails(self):
    # Call amdsmi_get_cpu_pwr_svi_telemetry_all_rails on every processor
    # handle; the last error _check_ret flags as a failure is re-raised
    # after the loop.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_pwr_svi_telemetry_all_rails(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_smu_fw_version(self):
    # Call amdsmi_get_cpu_smu_fw_version on every processor handle; the last
    # error _check_ret flags as a failure is re-raised after the loop.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_smu_fw_version(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_c0_residency(self):
    # Call amdsmi_get_cpu_socket_c0_residency on every processor handle; the
    # last error _check_ret flags as a failure is re-raised after the loop.
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    failure = None
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            outcome = amdsmi.amdsmi_get_cpu_socket_c0_residency(handle)
            self._print(label, outcome)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_current_active_freq_limit(self):
    """Call ``amdsmi_get_cpu_socket_current_active_freq_limit`` per handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_cpu_socket_current_active_freq_limit(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_energy(self):
    """Call ``amdsmi_get_cpu_socket_energy`` for each handle and print the result.

    Skipped up front when ``TODO_SKIP_FAIL`` is set. Errors that ``_check_ret``
    reports as truthy are deferred; the last one is re-raised after the loop.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_cpu_socket_energy as it fails.")
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_cpu_socket_energy(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_freq_range(self):
    """Call ``amdsmi_get_cpu_socket_freq_range`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_cpu_socket_freq_range(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_lclk_dpm_level(self):
    """Call ``amdsmi_get_cpu_socket_lclk_dpm_level`` per handle with ``nbio_id`` 0.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    nbio_id = 0  # only this one id is exercised
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): nbio_id({nbio_id}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_cpu_socket_lclk_dpm_level(handle, nbio_id))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_power(self):
    """Call ``amdsmi_get_cpu_socket_power`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_cpu_socket_power(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_power_cap(self):
    """Call ``amdsmi_get_cpu_socket_power_cap`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_cpu_socket_power_cap(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_power_cap_max(self):
    """Call ``amdsmi_get_cpu_socket_power_cap_max`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_cpu_socket_power_cap_max(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_cpu_socket_temperature(self):
    """Call ``amdsmi_get_cpu_socket_temperature`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_cpu_socket_temperature(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_energy_count(self):
    """Call ``amdsmi_get_energy_count`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_energy_count(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_esmi_err_msg(self):
    """Call ``amdsmi_get_esmi_err_msg`` with every status name in ``error_map``.

    Skipped up front when ``TODO_SKIP_NYI`` is set. Errors that ``_check_ret``
    reports as truthy are deferred; the last one is re-raised after the loop.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_esmi_err_msg as it is not implemented yet.")
    self.setUp()
    failure = None
    for status_num in error_map:
        msg = f'status({error_map[status_num]}): '
        status_name = error_map[status_num]
        try:
            self._print(msg, amdsmi.amdsmi_get_esmi_err_msg(status_name))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_fw_info(self):
    """Call ``amdsmi_get_fw_info`` for each processor handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f"gpu({i}): "
        try:
            self._print(msg, amdsmi.amdsmi_get_fw_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_accelerator_partition_profile(self):
    """Call ``amdsmi_get_gpu_accelerator_partition_profile`` per handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_accelerator_partition_profile(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_accelerator_partition_profile_config(self):
    """Call ``amdsmi_get_gpu_accelerator_partition_profile_config`` per handle.

    Each result is printed. Errors that ``_check_ret`` reports as truthy are
    deferred; the last one is re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_accelerator_partition_profile_config(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_activity(self):
    """Call ``amdsmi_get_gpu_activity`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_activity(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_asic_info(self):
    """Call ``amdsmi_get_gpu_asic_info`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_asic_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_bad_page_info(self):
    """Call ``amdsmi_get_gpu_bad_page_info`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_bad_page_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_bad_page_threshold(self):
    """Call ``amdsmi_get_gpu_bad_page_threshold`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_bad_page_threshold(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_bdf_id(self):
    """Call ``amdsmi_get_gpu_bdf_id`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_bdf_id(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_board_info(self):
    """Call ``amdsmi_get_gpu_board_info`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_board_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_cache_info(self):
    """Call ``amdsmi_get_gpu_cache_info`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried, in which case the trailing
    ``tearDown()`` call is not reached.
    """
    raise_exception = None
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    for i, processor in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            # The result is only printed; the former chained assignment to an
            # unused second local has been dropped.
            ret = amdsmi.amdsmi_get_gpu_cache_info(processor)
            self._print(msg, ret)
        except amdsmi.AmdSmiLibraryException as e:
            if self._check_ret(msg, e, self.PASS):
                raise_exception = e
    if raise_exception:
        raise raise_exception
    self.tearDown()
def test_get_gpu_compute_partition(self):
    """Call ``amdsmi_get_gpu_compute_partition`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_compute_partition(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_compute_process_gpus(self):
    """Call ``amdsmi_get_gpu_compute_process_gpus`` once with pid 0 and print it.

    Skipped up front when ``TODO_SKIP_FAIL`` is set. A library error is
    re-raised only when ``_check_ret`` returns a truthy value for it, in
    which case the trailing ``tearDown()`` call is not reached.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_gpu_compute_process_gpus as it fails.")
    raise_exception = None
    self.setUp()
    # TODO pid = 0
    pid = 0
    msg = f'pid({pid}): '
    try:
        # The result is only printed; the former chained assignment to an
        # unused second local has been dropped.
        ret = amdsmi.amdsmi_get_gpu_compute_process_gpus(pid)
        self._print(msg, ret)
    except amdsmi.AmdSmiLibraryException as e:
        if self._check_ret(msg, e, self.PASS):
            raise_exception = e
    if raise_exception:
        raise raise_exception
    self.tearDown()
def test_get_gpu_compute_process_info(self):
    """Call ``amdsmi_get_gpu_compute_process_info`` once per handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once the loop has finished.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    # NOTE(review): the call below takes no handle, so every iteration issues
    # the same query; only the printed 'gpu(i)' label changes. Confirm whether
    # a single call was intended.
    for i, _ in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_compute_process_info())
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_compute_process_info_by_pid(self):
    """Call ``amdsmi_get_gpu_compute_process_info_by_pid`` once with pid 0.

    Skipped up front when ``TODO_SKIP_FAIL`` is set. A library error is
    re-raised only when ``_check_ret`` returns a truthy value for it.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_gpu_compute_process_info_by_pid as it fails.")
    self.setUp()
    failure = None
    # TODO pid = 0
    pid = 0
    msg = f'pid({pid}): '
    try:
        self._print(msg, amdsmi.amdsmi_get_gpu_compute_process_info_by_pid(pid))
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(msg, err, self.PASS):
            failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_device_bdf(self):
    """Call ``amdsmi_get_gpu_device_bdf`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_device_bdf(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_device_uuid(self):
    """Call ``amdsmi_get_gpu_device_uuid`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_device_uuid(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_driver_info(self):
    """Call ``amdsmi_get_gpu_driver_info`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_driver_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_ecc_count(self):
    """Call ``amdsmi_get_gpu_ecc_count`` for each handle and each GPU block.

    Every ``self.gpu_blocks`` entry supplies a name, a block value and the
    condition passed to ``_check_ret``. Errors it reports as truthy are
    deferred; the last one is re-raised after all combinations have run.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        for gpu_block_name, gpu_block, gpu_block_cond in self.gpu_blocks:
            msg = f'gpu({i}): gpu_block({gpu_block_name}) '
            try:
                self._print(msg, amdsmi.amdsmi_get_gpu_ecc_count(handle, gpu_block))
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, gpu_block_cond):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_ecc_enabled(self):
    """Call ``amdsmi_get_gpu_ecc_enabled`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_ecc_enabled(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_ecc_status(self):
    """Call ``amdsmi_get_gpu_ecc_status`` for each handle and each GPU block.

    Skipped up front when ``TODO_SKIP_FAIL`` is set. Every ``self.gpu_blocks``
    entry supplies a name, a block value and the condition passed to
    ``_check_ret``; errors it reports as truthy are deferred and the last one
    is re-raised after all combinations have run.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_gpu_ecc_status as it fails.")
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        for gpu_block_name, gpu_block, gpu_block_cond in self.gpu_blocks:
            msg = f'gpu({i}): gpu_block({gpu_block_name}) '
            try:
                self._print(msg, amdsmi.amdsmi_get_gpu_ecc_status(handle, gpu_block))
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, gpu_block_cond):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_enumeration_info(self):
    """Call ``amdsmi_get_gpu_enumeration_info`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_enumeration_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_event_notification(self):
    """Call ``amdsmi_get_gpu_event_notification`` for each handle and print it.

    Skipped up front when ``TODO_SKIP_NYI`` is set. Errors that ``_check_ret``
    reports as truthy are deferred; the last one is re-raised after the loop.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_gpu_event_notification as it is not implemented yet.")
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_event_notification(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_fan_rpms(self):
    """Call ``amdsmi_get_gpu_fan_rpms`` for each handle with second argument 0.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            # The literal 0 is presumably a sensor index -- TODO confirm.
            self._print(msg, amdsmi.amdsmi_get_gpu_fan_rpms(handle, 0))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_fan_speed(self):
    """Call ``amdsmi_get_gpu_fan_speed`` for each handle with second argument 0.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            # The literal 0 is presumably a sensor index -- TODO confirm.
            self._print(msg, amdsmi.amdsmi_get_gpu_fan_speed(handle, 0))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_fan_speed_max(self):
    """Call ``amdsmi_get_gpu_fan_speed_max`` for each handle with second argument 0.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            # The literal 0 is presumably a sensor index -- TODO confirm.
            self._print(msg, amdsmi.amdsmi_get_gpu_fan_speed_max(handle, 0))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_id(self):
    """Call ``amdsmi_get_gpu_id`` for each processor handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_id(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_kfd_info(self):
    """Call ``amdsmi_get_gpu_kfd_info`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_kfd_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_mem_overdrive_level(self):
    """Call ``amdsmi_get_gpu_mem_overdrive_level`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_mem_overdrive_level(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_memory_partition(self):
    """Call ``amdsmi_get_gpu_memory_partition`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_memory_partition(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_memory_partition_config(self):
    """Call ``amdsmi_get_gpu_memory_partition_config`` per handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_memory_partition_config(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_memory_reserved_pages(self):
    """Call ``amdsmi_get_gpu_memory_reserved_pages`` per handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_memory_reserved_pages(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_memory_total(self):
    """Call ``amdsmi_get_gpu_memory_total`` for each handle and memory type.

    Every ``self.memory_types`` entry supplies a name, a type value and the
    condition passed to ``_check_ret``. Errors it reports as truthy are
    deferred; the last one is re-raised after all combinations have run.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        for memory_type_name, memory_type, memory_type_cond in self.memory_types:
            msg = f'gpu({i}): memory_type({memory_type_name}) '
            try:
                self._print(msg, amdsmi.amdsmi_get_gpu_memory_total(handle, memory_type))
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, memory_type_cond):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_memory_usage(self):
    """Call ``amdsmi_get_gpu_memory_usage`` for each handle and memory type.

    Every ``self.memory_types`` entry supplies a name, a type value and the
    condition passed to ``_check_ret``. Errors it reports as truthy are
    deferred; the last one is re-raised after all combinations have run.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        for memory_type_name, memory_type, memory_type_cond in self.memory_types:
            msg = f'gpu({i}): memory_type({memory_type_name}) '
            try:
                self._print(msg, amdsmi.amdsmi_get_gpu_memory_usage(handle, memory_type))
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, memory_type_cond):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_metrics_header_info(self):
    """Call ``amdsmi_get_gpu_metrics_header_info`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_metrics_header_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_metrics_info(self):
    """Call ``amdsmi_get_gpu_metrics_info`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_metrics_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_od_volt_curve_regions(self):
    """Call ``amdsmi_get_gpu_od_volt_curve_regions`` per handle with ``num_region`` 10.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    num_region = 10  # fixed request size used for every handle
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): num_region({num_region}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_od_volt_curve_regions(handle, num_region))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_od_volt_info(self):
    """Call ``amdsmi_get_gpu_od_volt_info`` for each handle and print the result.

    Skipped up front when ``TODO_SKIP_FAIL`` is set. Errors that ``_check_ret``
    reports as truthy are deferred; the last one is re-raised after the loop.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_gpu_od_volt_info as it fails.")
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_od_volt_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_overdrive_level(self):
    """Call ``amdsmi_get_gpu_overdrive_level`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_overdrive_level(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_pci_bandwidth(self):
    """Call ``amdsmi_get_gpu_pci_bandwidth`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_pci_bandwidth(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_pci_replay_counter(self):
    """Call ``amdsmi_get_gpu_pci_replay_counter`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_pci_replay_counter(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_pci_throughput(self):
    """Call ``amdsmi_get_gpu_pci_throughput`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_pci_throughput(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_perf_level(self):
    """Call ``amdsmi_get_gpu_perf_level`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_perf_level(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_pm_metrics_info(self):
    """Call ``amdsmi_get_gpu_pm_metrics_info`` for each handle and print it.

    Skipped up front when ``TODO_SKIP_FAIL`` is set. Errors that ``_check_ret``
    reports as truthy are deferred; the last one is re-raised after the loop.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_gpu_pm_metrics_info as it fails.")
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_pm_metrics_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_power_profile_presets(self):
    """Call ``amdsmi_get_gpu_power_profile_presets`` per handle with second argument 0.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            # The literal 0 is presumably a sensor index -- TODO confirm.
            self._print(msg, amdsmi.amdsmi_get_gpu_power_profile_presets(handle, 0))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_process_isolation(self):
    """Call ``amdsmi_get_gpu_process_isolation`` for each handle and print it.

    Skipped up front when ``TODO_SKIP_NYI`` is set. Errors that ``_check_ret``
    reports as truthy are deferred; the last one is re-raised after the loop.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_gpu_process_isolation as it is not implemented yet.")
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_process_isolation(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_process_list(self):
    """Call ``amdsmi_get_gpu_process_list`` for each handle and print the result.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_process_list(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_ras_block_features_enabled(self):
    """Call ``amdsmi_get_gpu_ras_block_features_enabled`` per handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_ras_block_features_enabled(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_ras_feature_info(self):
    """Call ``amdsmi_get_gpu_ras_feature_info`` for each handle and print it.

    Errors that ``_check_ret`` reports as truthy are deferred; the last one is
    re-raised once every handle has been tried.
    """
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_ras_feature_info(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_reg_table_info(self):
    """Call ``amdsmi_get_gpu_reg_table_info`` for each handle and register type.

    Skipped up front when ``TODO_SKIP_FAIL`` is set. Every ``self.reg_types``
    entry supplies a name, a type value and the condition passed to
    ``_check_ret``; errors it reports as truthy are deferred and the last one
    is re-raised after all combinations have run.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_gpu_reg_table_info as it fails.")
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        for reg_type_name, reg_type, reg_type_cond in self.reg_types:
            msg = f'gpu({i}): reg_type({reg_type_name}): '
            try:
                self._print(msg, amdsmi.amdsmi_get_gpu_reg_table_info(handle, reg_type))
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, reg_type_cond):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_revision(self):
    """Call ``amdsmi_get_gpu_revision`` for each handle and print the result.

    Skipped up front when ``TODO_SKIP_NYI`` is set. Errors that ``_check_ret``
    reports as truthy are deferred; the last one is re-raised after the loop.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_gpu_revision as it is not implemented yet.")
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    failure = None
    for i, handle in enumerate(processors):
        msg = f'gpu({i}): '
        try:
            self._print(msg, amdsmi.amdsmi_get_gpu_revision(handle))
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_get_gpu_subsystem_id(self):
    """Call amdsmi_get_gpu_subsystem_id on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_subsystem_id(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_subsystem_name(self):
    """Call amdsmi_get_gpu_subsystem_name on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_subsystem_name(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_topo_numa_affinity(self):
    """Call amdsmi_get_gpu_topo_numa_affinity on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_topo_numa_affinity(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_total_ecc_count(self):
    """Call amdsmi_get_gpu_total_ecc_count on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_total_ecc_count(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_vbios_info(self):
    """Call amdsmi_get_gpu_vbios_info on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_vbios_info(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_vendor_name(self):
    """Call amdsmi_get_gpu_vendor_name on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_vendor_name(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_virtualization_mode(self):
    """Call amdsmi_get_gpu_virtualization_mode on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_virtualization_mode(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_volt_metric(self):
    """Call amdsmi_get_gpu_volt_metric for every handle / voltage type / voltage metric combination.

    When the call raises, the condition passed to `_check_ret` is the
    voltage type's condition if it is not PASS, otherwise the voltage
    metric's condition if that is not PASS, otherwise PASS.
    """
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for type_name, type_value, type_cond in self.voltage_types:
            for metric_name, metric_value, metric_cond in self.voltage_metrics:
                label = f'gpu({idx}): voltage_type({type_name}) voltage_metric({metric_name}): '
                try:
                    result = amdsmi.amdsmi_get_gpu_volt_metric(handle, type_value, metric_value)
                    self._print(label, result)
                except amdsmi.AmdSmiLibraryException as err:
                    # A non-PASS type condition takes precedence over the metric condition.
                    if type_cond != self.PASS:
                        expected = type_cond
                    elif metric_cond != self.PASS:
                        expected = metric_cond
                    else:
                        expected = self.PASS
                    if self._check_ret(label, err, expected):
                        pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_vram_info(self):
    """Call amdsmi_get_gpu_vram_info on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_vram_info(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_vram_usage(self):
    """Call amdsmi_get_gpu_vram_usage on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_vram_usage(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_vram_vendor(self):
    """Call amdsmi_get_gpu_vram_vendor on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_vram_vendor(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_xcd_counter(self):
    """Call amdsmi_get_gpu_xcd_counter on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_xcd_counter(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_xgmi_link_status(self):
    """Call amdsmi_get_gpu_xgmi_link_status on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_gpu_xgmi_link_status(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_hsmp_metrics_table(self):
    """Call amdsmi_get_hsmp_metrics_table on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_hsmp_metrics_table(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_hsmp_metrics_table_version(self):
    """Call amdsmi_get_hsmp_metrics_table_version on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_hsmp_metrics_table_version(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_lib_version(self):
    """Call amdsmi_get_lib_version once and print the result.

    An AmdSmiLibraryException flagged by `_check_ret` is re-raised after
    the try block.
    """
    self.setUp()
    pending = None
    label = ''
    try:
        result = amdsmi.amdsmi_get_lib_version()
        self._print(label, result)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_link_metrics(self):
    """Call amdsmi_get_link_metrics on every processor handle and print the result.

    Skipped while `TODO_SKIP_FAIL` is set.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_link_metrics as it fails.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_link_metrics(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_link_topology_nearest(self):
    """Call amdsmi_get_link_topology_nearest for each (handle, link type) pair.

    Each entry of `self.link_types` supplies the condition handed to
    `_check_ret` when the call raises.
    """
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for type_name, type_value, expected in self.link_types:
            label = f'gpu({idx}): link_type({type_name}) '
            try:
                result = amdsmi.amdsmi_get_link_topology_nearest(handle, type_value)
                self._print(label, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, expected):
                    pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_minmax_bandwidth_between_processors(self):
    """Call amdsmi_get_minmax_bandwidth_between_processors for every ordered pair of handles.

    Skipped while `TODO_SKIP_FAIL` is set. Pairs include a handle with itself.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_minmax_bandwidth_between_processors as it fails.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for src_idx, src in enumerate(handles):
        for dst_idx, dst in enumerate(handles):
            label = f'gpu({src_idx},{dst_idx}): '
            try:
                result = amdsmi.amdsmi_get_minmax_bandwidth_between_processors(src, dst)
                self._print(label, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, self.PASS):
                    pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_pcie_info(self):
    """Call amdsmi_get_pcie_info on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_pcie_info(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_power_cap_info(self):
    """Call amdsmi_get_power_cap_info on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_power_cap_info(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_power_info(self):
    """Call amdsmi_get_power_info on every processor handle and print the result.

    The last AmdSmiLibraryException flagged by `_check_ret` is re-raised
    after all handles have been tried.
    """
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            # Single binding only: the extra `power_info` alias was never read.
            result = amdsmi.amdsmi_get_power_info(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_processor_count_from_handles(self):
    """Call amdsmi_get_processor_count_from_handles with each processor handle in turn.

    Skipped while `TODO_SKIP_NYI` is set.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_processor_count_from_handles as it is not implemented yet.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_processor_count_from_handles(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_processor_handle_from_bdf(self):
    """Look up each processor handle again through its own BDF and print the result.

    Skipped while `TODO_SKIP_FAIL` is set. The BDF for each handle is taken
    from amdsmi_get_gpu_device_bdf instead of the former placeholder `0`,
    so every iteration exercises a different, real address.
    NOTE(review): confirm the skip flag can be lifted for this test once
    this has been run on hardware.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_processor_handle_from_bdf as it fails.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            # Both calls sit inside the try so a failing BDF query is routed
            # through _check_ret like any other library error.
            bdf = amdsmi.amdsmi_get_gpu_device_bdf(handle)
            result = amdsmi.amdsmi_get_processor_handle_from_bdf(bdf)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_processor_handles(self):
    """Fetch the processor handles, assert there are between 1 and 32, and print each one.

    Nothing in this test collects a library exception, so no deferred
    re-raise is needed.
    """
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        self._print(f' {idx:2d} processor_handles: {handle}')
    self.tearDown()
def test_get_processor_handles_by_type(self):
    """Call amdsmi_get_processor_handles_by_type with each processor handle in turn.

    Skipped while `TODO_SKIP_NYI` is set.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_processor_handles_by_type as it is not implemented yet.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_processor_handles_by_type(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_processor_info(self):
    """Call amdsmi_get_processor_info on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_processor_info(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_processor_type(self):
    """Call amdsmi_get_processor_type on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_processor_type(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_soc_pstate(self):
    """Call amdsmi_get_soc_pstate on every processor handle and print the result.

    Skipped while `TODO_SKIP_NYI` is set.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_soc_pstate as it is not implemented yet.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_soc_pstate(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_socket_handles(self):
    """Call amdsmi_get_socket_handles once and print the result.

    Skipped while `TODO_SKIP_FAIL` is set.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_socket_handles as it fails.")
    self.setUp()
    pending = None
    label = ''
    try:
        result = amdsmi.amdsmi_get_socket_handles()
        self._print(label, result)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_socket_info(self):
    """Call amdsmi_get_socket_info on every socket handle and print the result.

    Output lines are labelled `socket(i)`, matching what is iterated; the
    previous `gpu(i)` label was misleading because the index is a socket
    index, not a GPU index.
    """
    self.setUp()
    pending = None
    sockets = amdsmi.amdsmi_get_socket_handles()
    socket_count = len(sockets)
    self.assertGreaterEqual(socket_count, 1)
    # TODO Find maximum number of sockets
    self.assertLessEqual(socket_count, 32)
    for idx, socket_handle in enumerate(sockets):
        label = f'socket({idx}): '
        try:
            result = amdsmi.amdsmi_get_socket_info(socket_handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_temp_metric(self):
    """Call amdsmi_get_temp_metric for every handle / temperature type / temperature metric combination.

    When the call raises, the condition passed to `_check_ret` is the
    temperature type's condition if it is not PASS, otherwise the
    temperature metric's condition if that is not PASS, otherwise PASS.
    """
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for type_name, type_value, type_cond in self.temperature_types:
            for metric_name, metric_value, metric_cond in self.temperature_metrics:
                label = f'gpu({idx}): temperature_type=({type_name}) temperature_metric({metric_name}): '
                try:
                    result = amdsmi.amdsmi_get_temp_metric(handle, type_value, metric_value)
                    self._print(label, result)
                except amdsmi.AmdSmiLibraryException as err:
                    # A non-PASS type condition takes precedence over the metric condition.
                    if type_cond != self.PASS:
                        expected = type_cond
                    elif metric_cond != self.PASS:
                        expected = metric_cond
                    else:
                        expected = self.PASS
                    if self._check_ret(label, err, expected):
                        pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_threads_per_core(self):
    """Call amdsmi_get_threads_per_core once and print the result.

    Skipped while `TODO_SKIP_FAIL` is set.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_threads_per_core as it fails.")
    self.setUp()
    pending = None
    # TODO threads_per_core
    label = 'threads_per_core: '
    try:
        result = amdsmi.amdsmi_get_threads_per_core()
        self._print(label, result)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_utilization_count(self):
    """Call amdsmi_get_utilization_count for each (handle, utilization counter type) pair.

    Skipped while `TODO_SKIP_FAIL` is set. Each entry of
    `self.utilization_counter_types` supplies the condition handed to
    `_check_ret` when the call raises.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_utilization_count as it fails.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for type_name, type_value, expected in self.utilization_counter_types:
            label = f'gpu({idx}): utilization_counter_type({type_name}): '
            try:
                result = amdsmi.amdsmi_get_utilization_count(handle, type_value)
                self._print(label, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, expected):
                    pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_violation_status(self):
    """Call amdsmi_get_violation_status on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_violation_status(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_xgmi_info(self):
    """Call amdsmi_get_xgmi_info on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_xgmi_info(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_xgmi_plpd(self):
    """Call amdsmi_get_xgmi_plpd on every processor handle and print the result.

    Skipped while `TODO_SKIP_NYI` is set.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_get_xgmi_plpd as it is not implemented yet.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_get_xgmi_plpd(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_gpu_counter_group_supported(self):
    """Call amdsmi_gpu_counter_group_supported for each (handle, event group) pair.

    Skipped while `TODO_SKIP_FAIL` is set. Each entry of `self.event_groups`
    supplies the condition handed to `_check_ret` when the call raises.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_gpu_counter_group_supported as it fails.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for group_name, group_value, expected in self.event_groups:
            label = f'gpu({idx}): event_group({group_name}): '
            try:
                result = amdsmi.amdsmi_gpu_counter_group_supported(handle, group_value)
                self._print(label, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, expected):
                    pending = err
    if pending:
        raise pending
    self.tearDown()
if False: # TODO: create_counter, destroy_counter, read_counter, get_gpu_available_counters, gpu_control_counter
''' Check these:
test_get_gpu_pci_replay_counter
test_get_gpu_xcd_counter
test_gpu_counter_group_supported
'''
def test_gpu_create_counter(self):
    """Call amdsmi_gpu_create_counter for each (handle, event type) pair.

    Skipped while `TODO_SKIP_FAIL` is set. Each entry of `self.event_types`
    supplies the condition handed to `_check_ret` when the call raises.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_gpu_create_counter as it fails.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for type_name, type_value, expected in self.event_types:
            label = f'gpu({idx}): event_type({type_name}): '
            try:
                result = amdsmi.amdsmi_gpu_create_counter(handle, type_value)
                self._print(label, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, expected):
                    pending = err
    if pending:
        raise pending
    self.tearDown()
def test_gpu_destroy_counter(self):
    """Call amdsmi_gpu_destroy_counter on a placeholder event handle and print that handle.

    Skipped while `TODO_SKIP_FAIL` is set. The value printed is the event
    handle itself, not a return value from the library call.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_gpu_destroy_counter as it fails.")
    self.setUp()
    pending = None
    # TODO event_handle = 0
    event_handle = 0
    label = f'event_handle({event_handle}): '
    try:
        amdsmi.amdsmi_gpu_destroy_counter(event_handle)
        self._print(label, event_handle)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            pending = err
    if pending:
        raise pending
    self.tearDown()
def test_gpu_read_counter(self):
    """Call amdsmi_gpu_read_counter on a placeholder event handle once per processor handle.

    Skipped while `TODO_SKIP_FAIL` is set. The processor handles only
    determine how many times the call is repeated and the index shown in
    the label; the same event handle is read each time.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_gpu_read_counter as it fails.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO event_handle = 0
    event_handle = 0
    for idx in range(handle_count):
        label = f'gpu({idx}): event_handle({event_handle}): '
        try:
            result = amdsmi.amdsmi_gpu_read_counter(event_handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_get_gpu_available_counters(self):
    """Call amdsmi_get_gpu_available_counters for each (handle, event group) pair.

    Skipped while `TODO_SKIP_FAIL` is set. Each entry of `self.event_groups`
    supplies the condition handed to `_check_ret` when the call raises.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_get_gpu_available_counters as it fails.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for group_name, group_value, expected in self.event_groups:
            label = f'gpu({idx}): event_group({group_name}) '
            try:
                result = amdsmi.amdsmi_get_gpu_available_counters(handle, group_value)
                self._print(label, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, expected):
                    pending = err
    if pending:
        raise pending
    self.tearDown()
def test_gpu_control_counter(self):
    """Call amdsmi_gpu_control_counter on a placeholder event handle for every counter command.

    Skipped while `TODO_SKIP_FAIL` is set. The condition carried by each
    `self.counter_commands` entry is now what `_check_ret` receives, the
    same way the sibling tests treat their per-entry conditions; it was
    previously unpacked but ignored in favour of `self.PASS`.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_gpu_control_counter as it fails.")
    self.setUp()
    pending = None
    # TODO event_handle = 0
    event_handle = 0
    for command_name, command_value, expected in self.counter_commands:
        label = f'counter_command({command_name}): '
        try:
            result = amdsmi.amdsmi_gpu_control_counter(event_handle, command_value)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, expected):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_gpu_validate_ras_eeprom(self):
    """Call amdsmi_gpu_validate_ras_eeprom on every processor handle and print the result.

    Skipped while `TODO_SKIP_NYI` is set.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_gpu_validate_ras_eeprom as it is not implemented yet.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_gpu_validate_ras_eeprom(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_gpu_xgmi_error_status(self):
    """Call amdsmi_gpu_xgmi_error_status on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_gpu_xgmi_error_status(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_init(self):
    """Call amdsmi_init once (after the explicit setUp) and print the result.

    An AmdSmiLibraryException flagged by `_check_ret` is re-raised after
    the try block.
    """
    self.setUp()
    pending = None
    label = ''
    try:
        result = amdsmi.amdsmi_init()
        self._print(label, result)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            pending = err
    if pending:
        raise pending
    self.tearDown()
def test_shut_down(self):
    """Call amdsmi_shut_down once and print the result.

    NOTE(review): tearDown still runs after the explicit shut-down here;
    confirm that ordering is acceptable for the library.
    """
    self.setUp()
    pending = None
    label = ''
    try:
        result = amdsmi.amdsmi_shut_down()
        self._print(label, result)
    except amdsmi.AmdSmiLibraryException as err:
        if self._check_ret(label, err, self.PASS):
            pending = err
    if pending:
        raise pending
    self.tearDown()
def test_init_gpu_event_notification(self):
    """Call amdsmi_init_gpu_event_notification on every processor handle and print the result.

    Skipped while `TODO_SKIP_NYI` is set.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_init_gpu_event_notification as it is not implemented yet.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_init_gpu_event_notification(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_is_P2P_accessible(self):
    """Call amdsmi_is_P2P_accessible for every ordered pair of processor handles.

    Pairs include a handle with itself.
    """
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for src_idx, src in enumerate(handles):
        for dst_idx, dst in enumerate(handles):
            label = f'gpu({src_idx},{dst_idx}): '
            try:
                result = amdsmi.amdsmi_is_P2P_accessible(src, dst)
                self._print(label, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, self.PASS):
                    pending = err
    if pending:
        raise pending
    self.tearDown()
def test_is_gpu_power_management_enabled(self):
    """Call amdsmi_is_gpu_power_management_enabled on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_is_gpu_power_management_enabled(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_reset_gpu(self):
    """Call amdsmi_reset_gpu on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_reset_gpu(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_reset_gpu_fan(self):
    """Call amdsmi_reset_gpu_fan with second argument 0 on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_reset_gpu_fan(handle, 0)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_reset_gpu_xgmi_error(self):
    """Call amdsmi_reset_gpu_xgmi_error on every processor handle and print the result."""
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_reset_gpu_xgmi_error(handle)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_set_clk_freq(self):
    """Call amdsmi_set_clk_freq with a placeholder bitmask for each (handle, clock type) pair.

    Skipped while `TODO_SKIP_NOT_COMPLETE` is set. Each entry of
    `self.clk_types` supplies the condition handed to `_check_ret` when the
    call raises.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_clk_freq as it is not complete.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO freq_bitmask = 0
    freq_bitmask = 0
    for idx, handle in enumerate(handles):
        for type_name, type_value, expected in self.clk_types:
            label = f'gpu({idx}): clk_type({type_name}): freq_bitmask({freq_bitmask}): '
            try:
                result = amdsmi.amdsmi_set_clk_freq(handle, type_value, freq_bitmask)
                self._print(label, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(label, err, expected):
                    pending = err
    if pending:
        raise pending
    self.tearDown()
def test_set_cpu_core_boostlimit(self):
    """Call amdsmi_set_cpu_core_boostlimit with a placeholder limit on every processor handle.

    Skipped while `TODO_SKIP_NOT_COMPLETE` is set.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_cpu_core_boostlimit as it is not complete.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO boost_limit = 0
    boost_limit = 0
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): boost_limit({boost_limit}): '
        try:
            result = amdsmi.amdsmi_set_cpu_core_boostlimit(handle, boost_limit)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_set_cpu_df_pstate_range(self):
    """Call amdsmi_set_cpu_df_pstate_range with placeholder bounds on every processor handle.

    Skipped while `TODO_SKIP_NOT_COMPLETE` is set.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_cpu_df_pstate_range as it is not complete.")
    self.setUp()
    pending = None
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO max_pstate = 0, min_pstate = 0
    max_pstate = 0
    min_pstate = 0
    for idx, handle in enumerate(handles):
        label = f'gpu({idx}): max_pstate({max_pstate}) min_pstate({min_pstate}): '
        try:
            result = amdsmi.amdsmi_set_cpu_df_pstate_range(handle, max_pstate, min_pstate)
            self._print(label, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(label, err, self.PASS):
                pending = err
    if pending:
        raise pending
    self.tearDown()
def test_set_cpu_gmi3_link_width_range(self):
    """Call amdsmi_set_cpu_gmi3_link_width_range on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. Both link-width bounds are
    the placeholder value 0. The last library exception flagged by
    _check_ret is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_cpu_gmi3_link_width_range as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholders with meaningful link widths.
    min_link_width = 0
    max_link_width = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): min_link_width({min_link_width}) max_link_width({max_link_width}): '
        try:
            result = amdsmi.amdsmi_set_cpu_gmi3_link_width_range(handle, min_link_width, max_link_width)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_cpu_pcie_link_rate(self):
    """Call amdsmi_set_cpu_pcie_link_rate on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The rate control value is
    the placeholder 0. The last library exception flagged by _check_ret is
    re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_cpu_pcie_link_rate as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful rate control value.
    rate_ctrl = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): rate_ctrl({rate_ctrl}): '
        try:
            result = amdsmi.amdsmi_set_cpu_pcie_link_rate(handle, rate_ctrl)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_cpu_pwr_efficiency_mode(self):
    """Call amdsmi_set_cpu_pwr_efficiency_mode on every processor handle.

    Skipped while TODO_SKIP_NYI is set. The mode is the placeholder value 0.
    The last library exception for which _check_ret returns a truthy value
    is re-raised once every handle has been tried.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_set_cpu_pwr_efficiency_mode as it is not yet implemented.")
    raise_exception = None
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    # TODO: replace the placeholder with a meaningful efficiency mode.
    mode = 0
    for i, processor in enumerate(processors):
        msg = f'gpu({i}): mode({mode}): '
        try:
            # Use the amdsmi_-prefixed name, matching every other call in
            # this file.
            ret = amdsmi.amdsmi_set_cpu_pwr_efficiency_mode(processor, mode)
            self._print(msg, ret)
        except amdsmi.AmdSmiLibraryException as e:
            if self._check_ret(msg, e, self.PASS):
                raise_exception = e
    if raise_exception:
        raise raise_exception
    self.tearDown()
def test_set_cpu_socket_boostlimit(self):
    """Call amdsmi_set_cpu_socket_boostlimit on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The boost limit is the
    placeholder value 0. The last library exception flagged by _check_ret
    is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_cpu_socket_boostlimit as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful boost limit.
    boost_limit = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): boost_limit({boost_limit}): '
        try:
            result = amdsmi.amdsmi_set_cpu_socket_boostlimit(handle, boost_limit)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_cpu_socket_lclk_dpm_level(self):
    """Call amdsmi_set_cpu_socket_lclk_dpm_level on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. nbio_id, min_val and
    max_val are all the placeholder value 0. The last library exception
    flagged by _check_ret is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_cpu_socket_lclk_dpm_level as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholders with meaningful values.
    nbio_id = 0
    min_val = 0
    max_val = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): nbio_id({nbio_id}) min_val({min_val}) max_val({max_val}): '
        try:
            result = amdsmi.amdsmi_set_cpu_socket_lclk_dpm_level(handle, nbio_id, min_val, max_val)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_cpu_socket_power_cap(self):
    """Call amdsmi_set_cpu_socket_power_cap on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The power cap is the
    placeholder value 0. The last library exception flagged by _check_ret
    is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_cpu_socket_power_cap as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful power cap.
    power_cap = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): power_cap({power_cap}): '
        try:
            result = amdsmi.amdsmi_set_cpu_socket_power_cap(handle, power_cap)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_cpu_xgmi_width(self):
    """Call amdsmi_set_cpu_xgmi_width on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. Both width bounds are the
    placeholder value 0. The last library exception for which _check_ret
    returns a truthy value is re-raised once every handle has been tried.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_cpu_xgmi_width as it is not complete.")
    raise_exception = None
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    # TODO: replace the placeholders with meaningful xGMI widths.
    min_width = 0
    max_width = 0
    for i, processor in enumerate(processors):
        # Balanced parentheses so the log prefix matches the other tests'
        # "name(value) name(value): " layout.
        msg = f'gpu({i}): min_width({min_width}) max_width({max_width}): '
        try:
            ret = amdsmi.amdsmi_set_cpu_xgmi_width(processor, min_width, max_width)
            self._print(msg, ret)
        except amdsmi.AmdSmiLibraryException as e:
            if self._check_ret(msg, e, self.PASS):
                raise_exception = e
    if raise_exception:
        raise raise_exception
    self.tearDown()
def test_set_gpu_accelerator_partition_profile(self):
    """Call amdsmi_set_gpu_accelerator_partition_profile on every handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The profile index is the
    placeholder value 0. The last library exception flagged by _check_ret
    is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_accelerator_partition_profile as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful profile index.
    profile_index = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): profile_index({profile_index}): '
        try:
            result = amdsmi.amdsmi_set_gpu_accelerator_partition_profile(handle, profile_index)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_clk_limit(self):
    """Call amdsmi_set_gpu_clk_limit for every handle, clock type and limit type.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The limit value is the
    placeholder 0 for every combination drawn from self.clk_types and
    self.clk_limit_types. When the library raises, the expectation handed to
    _check_ret is the clock type's if it is not PASS, otherwise the limit
    type's if it is not PASS, otherwise PASS. The last exception for which
    _check_ret returns a truthy value is re-raised after all combinations
    have been tried.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_clk_limit as it is not complete.")
    raise_exception = None
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    # TODO value = 0 is for min and max, need to separate out values
    value = 0
    for i, processor in enumerate(processors):
        for clk_type_name, clk_type, clk_cond in self.clk_types:
            for clk_limit_type_name, clk_limit_type, clk_limit_cond in self.clk_limit_types:
                msg = f'gpu({i}): value({value}) clock_type=({clk_type_name}) clock_limit_type({clk_limit_type_name}): '
                try:
                    ret = amdsmi.amdsmi_set_gpu_clk_limit(processor, clk_type, clk_limit_type, value)
                    self._print(msg, ret)
                except amdsmi.AmdSmiLibraryException as e:
                    # Select the expectation from the *_cond entries; the
                    # limit-type enum itself is not an expectation.
                    if clk_cond != self.PASS:
                        expected = clk_cond
                    elif clk_limit_cond != self.PASS:
                        expected = clk_limit_cond
                    else:
                        expected = self.PASS
                    # As in the sibling tests, only record exceptions that
                    # _check_ret flags.
                    if self._check_ret(msg, e, expected):
                        raise_exception = e
    if raise_exception:
        raise raise_exception
    self.tearDown()
def test_set_gpu_clk_range(self):
    """Call amdsmi_set_gpu_clk_range for every handle and clock type.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. Both range bounds are the
    placeholder value 0. The expectation paired with each entry of
    self.clk_types is passed to _check_ret; the last exception it flags is
    re-raised after the loops.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_clk_range as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholders with meaningful clock bounds.
    min_clk_value = 0
    max_clk_value = 0
    for idx, handle in enumerate(handles):
        for clk_name, clk_kind, expected in self.clk_types:
            msg = f'gpu({idx}): min_clk_value({min_clk_value}) max_clk_value({max_clk_value}) clk_type({clk_name}): '
            try:
                result = amdsmi.amdsmi_set_gpu_clk_range(handle, min_clk_value, max_clk_value, clk_kind)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, expected):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_compute_partition(self):
    """Call amdsmi_set_gpu_compute_partition for every handle and partition type.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. Each entry of
    self.compute_partition_types supplies a name, a value and the
    expectation passed to _check_ret; the last exception it flags is
    re-raised after the loops.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_compute_partition as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for partition_name, partition, expected in self.compute_partition_types:
            msg = f'gpu({idx}): compute_partition_type({partition_name}): '
            try:
                result = amdsmi.amdsmi_set_gpu_compute_partition(handle, partition)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, expected):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_event_notification_mask(self):
    """Call amdsmi_set_gpu_event_notification_mask on every processor handle.

    Skipped while TODO_SKIP_NYI is set. Only the handle is passed to the
    library call. The last library exception flagged by _check_ret is
    re-raised after the loop.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_set_gpu_event_notification_mask as it is not implemented yet.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_set_gpu_event_notification_mask(handle)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_fan_speed(self):
    """Call amdsmi_set_gpu_fan_speed on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The second argument is the
    literal 0 and the fan speed is the placeholder value 0. The last library
    exception flagged by _check_ret is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_fan_speed as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful fan speed.
    fan_speed = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): fan_speed({fan_speed}): '
        try:
            result = amdsmi.amdsmi_set_gpu_fan_speed(handle, 0, fan_speed)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_memory_partition(self):
    """Call amdsmi_set_gpu_memory_partition for every handle and partition type.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. Each entry of
    self.memory_partition_types supplies a name, a value and the
    expectation passed to _check_ret; the last exception it flags is
    re-raised after the loops.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_memory_partition as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for partition_name, partition, expected in self.memory_partition_types:
            msg = f'gpu({idx}): memory_partition_type({partition_name}): '
            try:
                result = amdsmi.amdsmi_set_gpu_memory_partition(handle, partition)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, expected):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_memory_partition_mode(self):
    """Call amdsmi_set_gpu_memory_partition_mode for every handle and partition type.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. Each entry of
    self.memory_partition_types supplies a name, a value and the
    expectation passed to _check_ret; the last exception it flags is
    re-raised after the loops.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_memory_partition_mode as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for partition_name, partition, expected in self.memory_partition_types:
            msg = f'gpu({idx}): memory_partition_type({partition_name}): '
            try:
                result = amdsmi.amdsmi_set_gpu_memory_partition_mode(handle, partition)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, expected):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_od_clk_info(self):
    """Call amdsmi_set_gpu_od_clk_info for every handle, frequency index and clock type.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The value is the
    placeholder 0 for every combination drawn from self.freq_inds and
    self.clk_types. When the library raises, the expectation handed to
    _check_ret is the frequency index's if it is not PASS, otherwise the
    clock type's if it is not PASS, otherwise PASS. The last exception for
    which _check_ret returns a truthy value is re-raised after all
    combinations have been tried.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_od_clk_info as it is not complete.")
    raise_exception = None
    self.setUp()
    processors = amdsmi.amdsmi_get_processor_handles()
    self.assertGreaterEqual(len(processors), 1)
    self.assertLessEqual(len(processors), 32)
    # TODO: replace the placeholder with a meaningful clock value.
    value = 0
    for i, processor in enumerate(processors):
        for freq_ind_name, freq_ind, freq_ind_cond in self.freq_inds:
            for clk_type_name, clk_type, clk_cond in self.clk_types:
                msg = f'gpu({i}): freq_ind({freq_ind_name}) value({value}) clk_type({clk_type_name}): '
                try:
                    ret = amdsmi.amdsmi_set_gpu_od_clk_info(processor, freq_ind, value, clk_type)
                    self._print(msg, ret)
                except amdsmi.AmdSmiLibraryException as e:
                    # The first non-PASS expectation wins, frequency index
                    # before clock type.
                    if freq_ind_cond != self.PASS:
                        expected = freq_ind_cond
                    elif clk_cond != self.PASS:
                        expected = clk_cond
                    else:
                        expected = self.PASS
                    # As in the sibling tests, only record exceptions that
                    # _check_ret flags.
                    if self._check_ret(msg, e, expected):
                        raise_exception = e
    if raise_exception:
        raise raise_exception
    self.tearDown()
def test_set_gpu_od_volt_info(self):
    """Call amdsmi_set_gpu_od_volt_info on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. vpoint, clk_value and
    volt_value are all the placeholder value 0. The last library exception
    flagged by _check_ret is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_od_volt_info as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholders with meaningful values.
    vpoint = 0
    clk_value = 0
    volt_value = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): vpoint({vpoint}) clk_value({clk_value}) volt_value({volt_value}): '
        try:
            result = amdsmi.amdsmi_set_gpu_od_volt_info(handle, vpoint, clk_value, volt_value)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_overdrive_level(self):
    """Call amdsmi_set_gpu_overdrive_level on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The overdrive value is the
    placeholder 0. The last library exception flagged by _check_ret is
    re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_overdrive_level as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful overdrive value.
    overdrive_value = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): overdrive_value({overdrive_value}): '
        try:
            result = amdsmi.amdsmi_set_gpu_overdrive_level(handle, overdrive_value)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_pci_bandwidth(self):
    """Call amdsmi_set_gpu_pci_bandwidth on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The bitmask is the
    placeholder value 0. The last library exception flagged by _check_ret
    is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_pci_bandwidth as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful bitmask.
    bitmask = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): bitmask({bitmask}): '
        try:
            result = amdsmi.amdsmi_set_gpu_pci_bandwidth(handle, bitmask)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_perf_determinism_mode(self):
    """Call amdsmi_set_gpu_perf_determinism_mode on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The clock value is the
    placeholder 0. The last library exception flagged by _check_ret is
    re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_perf_determinism_mode as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful clock value.
    clk_value = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): clk_value({clk_value}): '
        try:
            result = amdsmi.amdsmi_set_gpu_perf_determinism_mode(handle, clk_value)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_perf_level(self):
    """Call amdsmi_set_gpu_perf_level for every handle and performance level.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. Each entry of
    self.dev_perf_levels supplies a name, a value and the expectation
    passed to _check_ret; the last exception it flags is re-raised after
    the loops.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_perf_level as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO Need to set back to default
    for idx, handle in enumerate(handles):
        for level_name, level, expected in self.dev_perf_levels:
            msg = f'gpu({idx}): dev_perf_level({level_name}): '
            try:
                result = amdsmi.amdsmi_set_gpu_perf_level(handle, level)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, expected):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_power_profile(self):
    """Call amdsmi_set_gpu_power_profile for every handle and preset mask.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. Each entry of
    self.power_profile_preset_masks supplies a mask and the expectation
    passed to _check_ret; the second call argument is the literal 0. The
    last exception _check_ret flags is re-raised after the loops.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_gpu_power_profile as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        for preset_mask, expected in self.power_profile_preset_masks:
            msg = f'gpu({idx}): '
            try:
                result = amdsmi.amdsmi_set_gpu_power_profile(handle, 0, preset_mask)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, expected):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_gpu_process_isolation(self):
    """Call amdsmi_set_gpu_process_isolation on every processor handle.

    Skipped while TODO_SKIP_FAIL is set. The isolation value is the
    placeholder 0. The last library exception flagged by _check_ret is
    re-raised after the loop.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_set_gpu_process_isolation as it is not yet implemented.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful isolation value.
    pisolate = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_set_gpu_process_isolation(handle, pisolate)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_power_cap(self):
    """Call amdsmi_set_power_cap on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The second argument is the
    literal 0 and the cap is the placeholder value 0. The last library
    exception flagged by _check_ret is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_power_cap as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful power cap.
    cap = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_set_power_cap(handle, 0, cap)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_soc_pstate(self):
    """Call amdsmi_set_soc_pstate on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The policy id is the
    placeholder value 0. The last library exception flagged by _check_ret
    is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_soc_pstate as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful policy id.
    policy_id = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_set_soc_pstate(handle, policy_id)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_set_xgmi_plpd(self):
    """Call amdsmi_set_xgmi_plpd on every processor handle.

    Skipped while TODO_SKIP_NOT_COMPLETE is set. The policy id is the
    placeholder value 0. The last library exception flagged by _check_ret
    is re-raised after the loop.
    """
    if self.TODO_SKIP_NOT_COMPLETE:
        self.skipTest("Skipping test_set_xgmi_plpd as it is not complete.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    # TODO: replace the placeholder with a meaningful policy id.
    policy_id = 0
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_set_xgmi_plpd(handle, policy_id)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_status_code_to_string(self):
    """Print the result of amdsmi_status_code_to_string for status 0.

    Skipped while TODO_SKIP_FAIL is set. No exception is caught here, so
    anything raised by the library call propagates to the test runner.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_status_code_to_string as it fails.")
    self.setUp()
    # TODO: exercise more than the placeholder status value.
    status = 0
    status_code_to_string = amdsmi.amdsmi_status_code_to_string(status)
    self._print(f' {status} status_code_to_string: {status_code_to_string}')
    self.tearDown()
def test_stop_gpu_event_notification(self):
    """Call amdsmi_stop_gpu_event_notification on every processor handle.

    Skipped while TODO_SKIP_NYI is set. The last library exception flagged
    by _check_ret is re-raised after the loop.
    """
    if self.TODO_SKIP_NYI:
        self.skipTest("Skipping test_stop_gpu_event_notification as it is not implemented yet.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_stop_gpu_event_notification(handle)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_topo_get_link_type(self):
    """Call amdsmi_topo_get_link_type for every ordered pair of handles.

    Pairs include each handle with itself. The last library exception
    flagged by _check_ret is re-raised after all pairs have been tried.
    """
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for src_idx, src in enumerate(handles):
        for dst_idx, dst in enumerate(handles):
            msg = f'gpu({src_idx},{dst_idx}): '
            try:
                result = amdsmi.amdsmi_topo_get_link_type(src, dst)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, self.PASS):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_topo_get_link_weight(self):
    """Call amdsmi_topo_get_link_weight for every ordered pair of handles.

    Pairs include each handle with itself. The last library exception
    flagged by _check_ret is re-raised after all pairs have been tried.
    """
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for src_idx, src in enumerate(handles):
        for dst_idx, dst in enumerate(handles):
            msg = f'gpu({src_idx},{dst_idx}): '
            try:
                result = amdsmi.amdsmi_topo_get_link_weight(src, dst)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, self.PASS):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
def test_topo_get_numa_node_number(self):
    """Call amdsmi_topo_get_numa_node_number on every processor handle.

    The last library exception flagged by _check_ret is re-raised after
    every handle has been tried.
    """
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for idx, handle in enumerate(handles):
        msg = f'gpu({idx}): '
        try:
            result = amdsmi.amdsmi_topo_get_numa_node_number(handle)
            self._print(msg, result)
        except amdsmi.AmdSmiLibraryException as err:
            if self._check_ret(msg, err, self.PASS):
                failure = err
    if failure:
        raise failure
    self.tearDown()
def test_topo_get_p2p_status(self):
    """Call amdsmi_topo_get_p2p_status for every ordered pair of handles.

    Skipped while TODO_SKIP_FAIL is set. Pairs include each handle with
    itself. The last library exception flagged by _check_ret is re-raised
    after all pairs have been tried.
    """
    if self.TODO_SKIP_FAIL:
        self.skipTest("Skipping test_topo_get_p2p_status as it fails.")
    failure = None
    self.setUp()
    handles = amdsmi.amdsmi_get_processor_handles()
    handle_count = len(handles)
    self.assertGreaterEqual(handle_count, 1)
    self.assertLessEqual(handle_count, 32)
    for src_idx, src in enumerate(handles):
        for dst_idx, dst in enumerate(handles):
            msg = f'gpu({src_idx},{dst_idx}): '
            try:
                result = amdsmi.amdsmi_topo_get_p2p_status(src, dst)
                self._print(msg, result)
            except amdsmi.AmdSmiLibraryException as err:
                if self._check_ret(msg, err, self.PASS):
                    failure = err
    if failure:
        raise failure
    self.tearDown()
if __name__ == '__main__':
    # Translate the command-line flags into a unittest verbosity level
    # (0 for -q/--quiet, 2 for -v/--verbose, 1 otherwise) and pass it to the
    # runner so the computed value is actually used.
    verbose = 1
    if '-q' in sys.argv or '--quiet' in sys.argv:
        verbose = 0
    elif '-v' in sys.argv or '--verbose' in sys.argv:
        verbose = 2
    unittest.main(verbosity=verbose)