34f465bfc5
Removed: - handle_exceptions() Exposes, silences, and logs AMDSMI exceptions to users returns success/failure Signed-off-by: Juan Castillo <juan.castillo@amd.com>
4051 linhas
155 KiB
Python
Ficheiro executável
4051 linhas
155 KiB
Python
Ficheiro executável
#!/usr/bin/env python3
|
|
#
|
|
# Copyright (c) Advanced Micro Devices, Inc. All rights reserved.
|
|
#
|
|
# Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
# of this software and associated documentation files (the "Software"), to deal
|
|
# in the Software without restriction, including without limitation the rights
|
|
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
# copies of the Software, and to permit persons to whom the Software is
|
|
# furnished to do so, subject to the following conditions:
|
|
#
|
|
# The above copyright notice and this permission notice shall be included in
|
|
# all copies or substantial portions of the Software.
|
|
#
|
|
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
# THE SOFTWARE.
|
|
|
|
import inspect
|
|
import json
|
|
import sys
|
|
import unittest
|
|
sys.path.append("/opt/rocm/libexec/amdsmi_cli/")
|
|
|
|
try:
|
|
import amdsmi
|
|
except ImportError:
|
|
raise ImportError("Could not import /opt/rocm/libexec/amdsmi_cli/amdsmi_cli.py")
|
|
|
|
not_supported_error_codes = ['2', '3', '49']
|
|
not_supported_error_code_names = ['AMDSMI_STATUS_NOT_SUPPORTED', 'AMDSMI_STATUS_NOT_YET_IMPLEMENTED', 'AMDSMI_STATUS_NO_HSMP_MSG_SUP']
|
|
|
|
error_map = \
|
|
{
|
|
'0': 'AMDSMI_STATUS_SUCCESS',
|
|
'1': 'AMDSMI_STATUS_INVAL',
|
|
'2': 'AMDSMI_STATUS_NOT_SUPPORTED',
|
|
'3': 'AMDSMI_STATUS_NOT_YET_IMPLEMENTED',
|
|
'4': 'AMDSMI_STATUS_FAIL_LOAD_MODULE',
|
|
'5': 'AMDSMI_STATUS_FAIL_LOAD_SYMBOL',
|
|
'6': 'AMDSMI_STATUS_DRM_ERROR',
|
|
'7': 'AMDSMI_STATUS_API_FAILED',
|
|
'8': 'AMDSMI_STATUS_TIMEOUT',
|
|
'9': 'AMDSMI_STATUS_RETRY',
|
|
'10': 'AMDSMI_STATUS_NO_PERM',
|
|
'11': 'AMDSMI_STATUS_INTERRUPT',
|
|
'12': 'AMDSMI_STATUS_IO',
|
|
'13': 'AMDSMI_STATUS_ADDRESS_FAULT',
|
|
'14': 'AMDSMI_STATUS_FILE_ERROR',
|
|
'15': 'AMDSMI_STATUS_OUT_OF_RESOURCES',
|
|
'16': 'AMDSMI_STATUS_INTERNAL_EXCEPTION',
|
|
'17': 'AMDSMI_STATUS_INPUT_OUT_OF_BOUNDS',
|
|
'18': 'AMDSMI_STATUS_INIT_ERROR',
|
|
'19': 'AMDSMI_STATUS_REFCOUNT_OVERFLOW',
|
|
'30': 'AMDSMI_STATUS_BUSY',
|
|
'31': 'AMDSMI_STATUS_NOT_FOUND',
|
|
'32': 'AMDSMI_STATUS_NOT_INIT',
|
|
'33': 'AMDSMI_STATUS_NO_SLOT',
|
|
'34': 'AMDSMI_STATUS_DRIVER_NOT_LOADED',
|
|
'39': 'AMDSMI_STATUS_MORE_DATA',
|
|
'40': 'AMDSMI_STATUS_NO_DATA',
|
|
'41': 'AMDSMI_STATUS_INSUFFICIENT_SIZE',
|
|
'42': 'AMDSMI_STATUS_UNEXPECTED_SIZE',
|
|
'43': 'AMDSMI_STATUS_UNEXPECTED_DATA',
|
|
'44': 'AMDSMI_STATUS_NON_AMD_CPU',
|
|
'45': 'AMDSMI_STATUS_NO_ENERGY_DRV',
|
|
'46': 'AMDSMI_STATUS_NO_MSR_DRV',
|
|
'47': 'AMDSMI_STATUS_NO_HSMP_DRV',
|
|
'48': 'AMDSMI_STATUS_NO_HSMP_SUP',
|
|
'49': 'AMDSMI_STATUS_NO_HSMP_MSG_SUP',
|
|
'50': 'AMDSMI_STATUS_HSMP_TIMEOUT',
|
|
'51': 'AMDSMI_STATUS_NO_DRV',
|
|
'52': 'AMDSMI_STATUS_FILE_NOT_FOUND',
|
|
'53': 'AMDSMI_STATUS_ARG_PTR_NULL',
|
|
'54': 'AMDSMI_STATUS_AMDGPU_RESTART_ERR',
|
|
'55': 'AMDSMI_STATUS_SETTING_UNAVAILABLE',
|
|
'56': 'AMDSMI_STATUS_CORRUPTED_EEPROM',
|
|
'0xFFFFFFFE': 'AMDSMI_STATUS_MAP_ERROR',
|
|
'0xFFFFFFFF': 'AMDSMI_STATUS_UNKNOWN_ERROR'
|
|
}
|
|
|
|
|
|
class TestAmdSmiPythonBDF(unittest.TestCase):
|
|
valid_bdfs = {
|
|
"00:00.0": [0, 0, 0, 0],
|
|
"01:01.1": [0, 1, 1, 1],
|
|
"FF:1F.7": [0, 255, 31, 7],
|
|
"FF:00.7": [0, 255, 0, 7],
|
|
"11:01.2": [0, 17, 1, 2],
|
|
"11:0a.2": [0, 17, 10, 2],
|
|
"0000:FF:1F.7": [0, 255, 31, 7],
|
|
"0001:ff:1F.7": [1, 255, 31, 7],
|
|
"ffff:FF:1f.7": [65535, 255, 31, 7],
|
|
}
|
|
|
|
invalid_bdfs = {
|
|
# invalid bdf strings, expect None
|
|
None: None,
|
|
"": None,
|
|
"00:00:0": None,
|
|
"00.00:0": None,
|
|
"00:00.Z": None,
|
|
"00:0Z.0": None,
|
|
"0Z:00.0": None,
|
|
"Z00:00.0": None,
|
|
"A00:00.0": None,
|
|
"0A00:00.0": None,
|
|
"00:00.07": None,
|
|
"00:00.8": None,
|
|
"00:00.10": None,
|
|
"00:00.11": None,
|
|
"00:00.-1": None,
|
|
"00:00.*-1": None,
|
|
"00:00.123": None,
|
|
"00:20.0": None,
|
|
"00:45.0": None,
|
|
"00:200.0": None,
|
|
"00:002.0": None,
|
|
"100:00.0": None,
|
|
"0100:00.0": None,
|
|
"00100:00.0": None,
|
|
"0101:00.0": None,
|
|
"00001:00.0": None,
|
|
"10001:00.0": None,
|
|
"45:0.0": None,
|
|
".00:00.0": None,
|
|
"00.00.0": None,
|
|
"00.0.0": None,
|
|
"0.00.0": None,
|
|
"000.00.0": None,
|
|
"00 00 0": None,
|
|
" 00:00.0": None,
|
|
"00:00.0 ": None,
|
|
"0000:00.00.0": None,
|
|
"000:00:00.0": None,
|
|
"00:00:00.1": None,
|
|
"0:00:00.1": None,
|
|
"0000 00 00 0": None,
|
|
"-1-1:00:00.0": None,
|
|
"AAAA:00:AA.0": None,
|
|
"*1*1:00:00.0": None,
|
|
"0000:00:00.07": None,
|
|
"0000:00:00.8": None,
|
|
"0000:00:00.10": None,
|
|
"0000:00:00.11": None,
|
|
"0000:00:00.-1": None,
|
|
"0000:00:00.*-1": None,
|
|
"0000:00:00.123": None,
|
|
"0000:00:20.0": None,
|
|
"0000:00:45.0": None,
|
|
"0000:00:200.0": None,
|
|
"0000:00:002.0": None,
|
|
"0000:100:00.0": None,
|
|
"0000:0100:00.0": None,
|
|
"0000:00100:00.0": None,
|
|
"0000:0101:00.0": None,
|
|
"0000:00001:00.0": None,
|
|
"0000:10001:00.0": None,
|
|
"0000:45:0.0": None,
|
|
".0000.00:00.0": None,
|
|
"0000.00.0.0": None,
|
|
" 0000:00:00.0": None,
|
|
"0000:00:00.0 ": None,
|
|
}
|
|
|
|
PASS = 'AMDSMI_STATUS_SUCCESS'
|
|
FAIL = 'AMDSMI_STATUS_INVAL'
|
|
|
|
# Tests marked wtih either of these flags will be skipped
|
|
# and need to be implemented later.
|
|
TODO_SKIP_NYI = True
|
|
TODO_SKIP_FAIL = True
|
|
TODO_SKIP_NOT_COMPLETE = True
|
|
|
|
clk_types = \
|
|
[
|
|
('SYS', amdsmi.AmdSmiClkType.SYS, PASS),
|
|
('GFX', amdsmi.AmdSmiClkType.GFX, PASS),
|
|
('DF', amdsmi.AmdSmiClkType.DF, PASS),
|
|
('DCEF', amdsmi.AmdSmiClkType.DCEF, PASS),
|
|
('SOC', amdsmi.AmdSmiClkType.SOC, PASS),
|
|
('MEM', amdsmi.AmdSmiClkType.MEM, PASS),
|
|
('PCIE', amdsmi.AmdSmiClkType.PCIE, PASS),
|
|
('VCLK0', amdsmi.AmdSmiClkType.VCLK0, PASS),
|
|
('VCLK1', amdsmi.AmdSmiClkType.VCLK1, PASS),
|
|
('DCLK0', amdsmi.AmdSmiClkType.DCLK0, PASS),
|
|
('DCLK1', amdsmi.AmdSmiClkType.DCLK1, PASS)
|
|
]
|
|
|
|
clk_limit_types = \
|
|
[
|
|
('MIN', amdsmi.AmdSmiClkLimitType.MIN, PASS),
|
|
('MAX', amdsmi.AmdSmiClkLimitType.MAX, PASS)
|
|
]
|
|
|
|
io_bw_encodings = \
|
|
[
|
|
('AGG_BW0', amdsmi.amdsmi_wrapper.AGG_BW0, PASS),
|
|
('RD_BW0', amdsmi.amdsmi_wrapper.RD_BW0, PASS),
|
|
('WR_BW0', amdsmi.amdsmi_wrapper.WR_BW0, PASS)
|
|
]
|
|
|
|
event_groups = \
|
|
[
|
|
('XGMI', amdsmi.AmdSmiEventGroup.XGMI, PASS),
|
|
('XGMI_DATA_OUT', amdsmi.AmdSmiEventGroup.XGMI_DATA_OUT, PASS),
|
|
('GRP_INVALID', amdsmi.AmdSmiEventGroup.GRP_INVALID, FAIL)
|
|
]
|
|
|
|
gpu_blocks = \
|
|
[
|
|
('INVALID', amdsmi.AmdSmiGpuBlock.INVALID, FAIL),
|
|
('UMC', amdsmi.AmdSmiGpuBlock.UMC, PASS),
|
|
('SDMA', amdsmi.AmdSmiGpuBlock.SDMA, PASS),
|
|
('GFX', amdsmi.AmdSmiGpuBlock.GFX, PASS),
|
|
('MMHUB', amdsmi.AmdSmiGpuBlock.MMHUB, PASS),
|
|
('ATHUB', amdsmi.AmdSmiGpuBlock.ATHUB, PASS),
|
|
('PCIE_BIF', amdsmi.AmdSmiGpuBlock.PCIE_BIF, PASS),
|
|
('HDP', amdsmi.AmdSmiGpuBlock.HDP, PASS),
|
|
('XGMI_WAFL', amdsmi.AmdSmiGpuBlock.XGMI_WAFL, PASS),
|
|
('DF', amdsmi.AmdSmiGpuBlock.DF, PASS),
|
|
('SMN', amdsmi.AmdSmiGpuBlock.SMN, PASS),
|
|
('SEM', amdsmi.AmdSmiGpuBlock.SEM, PASS),
|
|
('MP0', amdsmi.AmdSmiGpuBlock.MP0, PASS),
|
|
('MP1', amdsmi.AmdSmiGpuBlock.MP1, PASS),
|
|
('FUSE', amdsmi.AmdSmiGpuBlock.FUSE, PASS),
|
|
('MCA', amdsmi.AmdSmiGpuBlock.MCA, PASS),
|
|
('VCN', amdsmi.AmdSmiGpuBlock.VCN, PASS),
|
|
('JPEG', amdsmi.AmdSmiGpuBlock.JPEG, PASS),
|
|
('IH', amdsmi.AmdSmiGpuBlock.IH, PASS),
|
|
('MPIO', amdsmi.AmdSmiGpuBlock.MPIO, PASS),
|
|
('RESERVED', amdsmi.AmdSmiGpuBlock.RESERVED, FAIL)
|
|
]
|
|
|
|
memory_types = \
|
|
[
|
|
('VRAM', amdsmi.AmdSmiMemoryType.VRAM, PASS),
|
|
('VIS_VRAM', amdsmi.AmdSmiMemoryType.VIS_VRAM, PASS),
|
|
('GTT', amdsmi.AmdSmiMemoryType.GTT, PASS)
|
|
]
|
|
|
|
reg_types = \
|
|
[
|
|
('XGMI', amdsmi.AmdSmiRegType.XGMI, PASS),
|
|
('WAFL', amdsmi.AmdSmiRegType.WAFL, PASS),
|
|
('PCIE', amdsmi.AmdSmiRegType.PCIE, PASS),
|
|
('USR', amdsmi.AmdSmiRegType.USR, PASS),
|
|
('USR1', amdsmi.AmdSmiRegType.USR1, PASS)
|
|
]
|
|
|
|
voltage_metrics = \
|
|
[
|
|
('CURRENT', amdsmi.AmdSmiVoltageMetric.CURRENT, PASS),
|
|
('MAX', amdsmi.AmdSmiVoltageMetric.MAX, PASS),
|
|
('MIN_CRIT', amdsmi.AmdSmiVoltageMetric.MIN_CRIT, PASS),
|
|
('MIN', amdsmi.AmdSmiVoltageMetric.MIN, PASS),
|
|
('MAX_CRIT', amdsmi.AmdSmiVoltageMetric.MAX_CRIT, PASS),
|
|
('AVERAGE', amdsmi.AmdSmiVoltageMetric.AVERAGE, PASS),
|
|
('LOWEST', amdsmi.AmdSmiVoltageMetric.LOWEST, PASS),
|
|
('HIGHEST', amdsmi.AmdSmiVoltageMetric.HIGHEST, PASS)
|
|
]
|
|
|
|
voltage_types = \
|
|
[
|
|
('VDDGFX', amdsmi.AmdSmiVoltageType.VDDGFX, PASS),
|
|
('INVALID', amdsmi.AmdSmiVoltageType.INVALID, FAIL)
|
|
]
|
|
|
|
link_types = \
|
|
[
|
|
('AMDSMI_LINK_TYPE_INTERNAL', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_INTERNAL, PASS),
|
|
('AMDSMI_LINK_TYPE_XGMI', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_XGMI, PASS),
|
|
('AMDSMI_LINK_TYPE_PCIE', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_PCIE, PASS),
|
|
('AMDSMI_LINK_TYPE_NOT_APPLICABLE', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_NOT_APPLICABLE, FAIL),
|
|
('AMDSMI_LINK_TYPE_UNKNOWN', amdsmi.AmdSmiLinkType.AMDSMI_LINK_TYPE_UNKNOWN, FAIL)
|
|
]
|
|
|
|
temperature_types = \
|
|
[
|
|
('EDGE', amdsmi.AmdSmiTemperatureType.EDGE, PASS),
|
|
('HOTSPOT', amdsmi.AmdSmiTemperatureType.HOTSPOT, PASS),
|
|
('JUNCTION', amdsmi.AmdSmiTemperatureType.JUNCTION, PASS),
|
|
('VRAM', amdsmi.AmdSmiTemperatureType.VRAM, PASS),
|
|
('HBM_0', amdsmi.AmdSmiTemperatureType.HBM_0, PASS),
|
|
('HBM_1', amdsmi.AmdSmiTemperatureType.HBM_1, PASS),
|
|
('HBM_2', amdsmi.AmdSmiTemperatureType.HBM_2, PASS),
|
|
('HBM_3', amdsmi.AmdSmiTemperatureType.HBM_3, PASS),
|
|
('PLX', amdsmi.AmdSmiTemperatureType.PLX, PASS)
|
|
]
|
|
|
|
temperature_metrics = \
|
|
[
|
|
('CURRENT', amdsmi.AmdSmiTemperatureMetric.CURRENT, PASS),
|
|
('MAX', amdsmi.AmdSmiTemperatureMetric.MAX, PASS),
|
|
('MIN', amdsmi.AmdSmiTemperatureMetric.MIN, PASS),
|
|
('MAX_HYST', amdsmi.AmdSmiTemperatureMetric.MAX_HYST, PASS),
|
|
('MIN_HYST', amdsmi.AmdSmiTemperatureMetric.MIN_HYST, PASS),
|
|
('CRITICAL', amdsmi.AmdSmiTemperatureMetric.CRITICAL, PASS),
|
|
('CRITICAL_HYST', amdsmi.AmdSmiTemperatureMetric.CRITICAL_HYST, PASS),
|
|
('EMERGENCY', amdsmi.AmdSmiTemperatureMetric.EMERGENCY, PASS),
|
|
('EMERGENCY_HYST', amdsmi.AmdSmiTemperatureMetric.EMERGENCY_HYST, PASS),
|
|
('CRIT_MIN', amdsmi.AmdSmiTemperatureMetric.CRIT_MIN, PASS),
|
|
('CRIT_MIN_HYST', amdsmi.AmdSmiTemperatureMetric.CRIT_MIN_HYST, PASS),
|
|
('OFFSET', amdsmi.AmdSmiTemperatureMetric.OFFSET, PASS),
|
|
('LOWEST', amdsmi.AmdSmiTemperatureMetric.LOWEST, PASS),
|
|
('HIGHEST', amdsmi.AmdSmiTemperatureMetric.HIGHEST, PASS)
|
|
]
|
|
|
|
utilization_counter_types = \
|
|
[
|
|
('COARSE_GRAIN_GFX_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.COARSE_GRAIN_GFX_ACTIVITY, PASS),
|
|
('COARSE_GRAIN_MEM_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.COARSE_GRAIN_MEM_ACTIVITY, PASS),
|
|
('COARSE_DECODER_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.COARSE_DECODER_ACTIVITY, PASS),
|
|
('FINE_GRAIN_GFX_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.FINE_GRAIN_GFX_ACTIVITY, PASS),
|
|
('FINE_GRAIN_MEM_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.FINE_GRAIN_MEM_ACTIVITY, PASS),
|
|
('FINE_DECODER_ACTIVITY', amdsmi.AmdSmiUtilizationCounterType.FINE_DECODER_ACTIVITY, PASS),
|
|
('UTILIZATION_COUNTER_FIRST', amdsmi.AmdSmiUtilizationCounterType.UTILIZATION_COUNTER_FIRST, PASS),
|
|
('UTILIZATION_COUNTER_LAST', amdsmi.AmdSmiUtilizationCounterType.UTILIZATION_COUNTER_LAST, PASS)
|
|
]
|
|
|
|
event_types = \
|
|
[
|
|
('XGMI_0_NOP_TX', amdsmi.AmdSmiEventType.XGMI_0_NOP_TX, PASS),
|
|
('XGMI_0_REQUEST_TX', amdsmi.AmdSmiEventType.XGMI_0_REQUEST_TX, PASS),
|
|
('XGMI_0_RESPONSE_TX', amdsmi.AmdSmiEventType.XGMI_0_RESPONSE_TX, PASS),
|
|
('XGMI_0_BEATS_TX', amdsmi.AmdSmiEventType.XGMI_0_BEATS_TX, PASS),
|
|
('XGMI_1_NOP_TX', amdsmi.AmdSmiEventType.XGMI_1_NOP_TX, PASS),
|
|
('XGMI_1_REQUEST_TX', amdsmi.AmdSmiEventType.XGMI_1_REQUEST_TX, PASS),
|
|
('XGMI_1_RESPONSE_TX', amdsmi.AmdSmiEventType.XGMI_1_RESPONSE_TX, PASS),
|
|
('XGMI_1_BEATS_TX', amdsmi.AmdSmiEventType.XGMI_1_BEATS_TX, PASS),
|
|
('XGMI_DATA_OUT_0', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_0, PASS),
|
|
('XGMI_DATA_OUT_1', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_1, PASS),
|
|
('XGMI_DATA_OUT_2', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_2, PASS),
|
|
('XGMI_DATA_OUT_3', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_3, PASS),
|
|
('XGMI_DATA_OUT_4', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_4, PASS),
|
|
('XGMI_DATA_OUT_5', amdsmi.AmdSmiEventType.XGMI_DATA_OUT_5, PASS)
|
|
]
|
|
|
|
counter_commands = \
|
|
[
|
|
('CMD_START', amdsmi.AmdSmiCounterCommand.CMD_START, PASS),
|
|
('CMD_STOP', amdsmi.AmdSmiCounterCommand.CMD_STOP, PASS)
|
|
]
|
|
|
|
compute_partition_types = \
|
|
[
|
|
('SPX', amdsmi.AmdSmiComputePartitionType.SPX, PASS),
|
|
('DPX', amdsmi.AmdSmiComputePartitionType.DPX, PASS),
|
|
('TPX', amdsmi.AmdSmiComputePartitionType.TPX, PASS),
|
|
('QPX', amdsmi.AmdSmiComputePartitionType.QPX, PASS),
|
|
('CPX', amdsmi.AmdSmiComputePartitionType.CPX, PASS),
|
|
('INVALID', amdsmi.AmdSmiComputePartitionType.INVALID, FAIL)
|
|
]
|
|
|
|
memory_partition_types = \
|
|
[
|
|
('NPS1', amdsmi.AmdSmiMemoryPartitionType.NPS1, PASS),
|
|
('NPS2', amdsmi.AmdSmiMemoryPartitionType.NPS2, PASS),
|
|
('NPS4', amdsmi.AmdSmiMemoryPartitionType.NPS4, PASS),
|
|
('NPS8', amdsmi.AmdSmiMemoryPartitionType.NPS8, PASS),
|
|
('UNKNOWN', amdsmi.AmdSmiMemoryPartitionType.UNKNOWN, FAIL)
|
|
]
|
|
|
|
freq_inds = \
|
|
[
|
|
('MIN', amdsmi.AmdSmiFreqInd.MIN, PASS),
|
|
('MAX', amdsmi.AmdSmiFreqInd.MAX, PASS),
|
|
('INVALID', amdsmi.AmdSmiFreqInd.INVALID, FAIL)
|
|
]
|
|
|
|
dev_perf_levels = \
|
|
[
|
|
('AUTO', amdsmi.AmdSmiDevPerfLevel.AUTO, PASS),
|
|
('LOW', amdsmi.AmdSmiDevPerfLevel.LOW, PASS),
|
|
('HIGH', amdsmi.AmdSmiDevPerfLevel.HIGH, PASS),
|
|
('MANUAL', amdsmi.AmdSmiDevPerfLevel.MANUAL, PASS),
|
|
('STABLE_STD', amdsmi.AmdSmiDevPerfLevel.STABLE_STD, PASS),
|
|
('STABLE_PEAK', amdsmi.AmdSmiDevPerfLevel.STABLE_PEAK, PASS),
|
|
('STABLE_MIN_MCLK', amdsmi.AmdSmiDevPerfLevel.STABLE_MIN_MCLK, PASS),
|
|
('STABLE_MIN_SCLK', amdsmi.AmdSmiDevPerfLevel.STABLE_MIN_SCLK, PASS),
|
|
('DETERMINISM', amdsmi.AmdSmiDevPerfLevel.DETERMINISM, PASS),
|
|
('UNKNOWN', amdsmi.AmdSmiDevPerfLevel.UNKNOWN, FAIL)
|
|
]
|
|
|
|
power_profile_preset_masks = \
|
|
[
|
|
('CUSTOM_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.CUSTOM_MASK, PASS),
|
|
('VIDEO_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.VIDEO_MASK, PASS),
|
|
('POWER_SAVING_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.POWER_SAVING_MASK, PASS),
|
|
('COMPUTE_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.COMPUTE_MASK, PASS),
|
|
('VR_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.VR_MASK, PASS),
|
|
('THREE_D_FULL_SCR_MASK', amdsmi.AmdSmiPowerProfilePresetMasks.THREE_D_FULL_SCR_MASK, PASS),
|
|
('BOOTUP_DEFAULT', amdsmi.AmdSmiPowerProfilePresetMasks.BOOTUP_DEFAULT, PASS),
|
|
('INVALID', amdsmi.AmdSmiPowerProfilePresetMasks.INVALID, FAIL)
|
|
]
|
|
|
|
def test_parse_bdf(self):
|
|
# go through all bdfs
|
|
expectations = self.valid_bdfs.copy()
|
|
expectations.update(self.invalid_bdfs)
|
|
for bdf in expectations:
|
|
expected = expectations[bdf]
|
|
result = amdsmi.amdsmi_interface._parse_bdf(bdf)
|
|
self.assertEqual(result, expected,
|
|
"Expected {} for bdf {}, but got {}".format(
|
|
expected, bdf, result))
|
|
|
|
@classmethod
|
|
def _convert_bdf_to_long(clz, bdf):
|
|
if len(bdf) == 12:
|
|
return bdf
|
|
if len(bdf) == 7:
|
|
return "0000:" + bdf
|
|
return None
|
|
|
|
def test_format_bdf(self):
|
|
# go through valid bdfs
|
|
expectations = self.valid_bdfs.copy()
|
|
for bdf_string in expectations:
|
|
# use key as result and value as input
|
|
bdf_list = expectations[bdf_string]
|
|
smi_bdf = amdsmi.amdsmi_interface._make_amdsmi_bdf_from_list(bdf_list)
|
|
expected = TestAmdSmiPythonBDF._convert_bdf_to_long(bdf_string)
|
|
expected = expected.lower()
|
|
result = amdsmi.amdsmi_interface._format_bdf(smi_bdf)
|
|
self.assertEqual(result, expected,
|
|
"Expected {} for bdf {}, but got {}".format(
|
|
expected, bdf_string, result))
|
|
|
|
def test_check_res(self):
|
|
# expect retry error to raise SmiRetryException
|
|
with self.assertRaises(amdsmi.AmdSmiRetryException) as retry_test:
|
|
amdsmi.amdsmi_interface._check_res(
|
|
(lambda: amdsmi.amdsmi_interface.amdsmi_wrapper.AMDSMI_STATUS_RETRY)())
|
|
# except retry error to have AMDSMI_STATUS_RETRY error code
|
|
self.assertEqual(retry_test.exception.get_error_code(),
|
|
amdsmi.amdsmi_interface.amdsmi_wrapper.AMDSMI_STATUS_RETRY)
|
|
# expect invalid args error to raise AmdSmiLibraryException
|
|
with self.assertRaises(amdsmi.AmdSmiLibraryException) as inval_test:
|
|
amdsmi.amdsmi_interface._check_res(
|
|
(lambda: amdsmi.amdsmi_interface.amdsmi_wrapper.AMDSMI_STATUS_INVAL)())
|
|
# expect invalid args error to have AMDSMI_STATUS_INVAL error code
|
|
self.assertEqual(inval_test.exception.get_error_code(),
|
|
amdsmi.amdsmi_interface.amdsmi_wrapper.AMDSMI_STATUS_INVAL)
|
|
# for successfull call, expect no error is given
|
|
result = amdsmi.amdsmi_interface._check_res(
|
|
(lambda: amdsmi.amdsmi_interface.amdsmi_wrapper.AMDSMI_STATUS_SUCCESS)())
|
|
self.assertEqual(None, result)
|
|
|
|
@classmethod
|
|
def _print(self, msg, data=None, cond=None):
|
|
if verbose == 2:
|
|
if not data:
|
|
print(msg, flush=True)
|
|
elif data in not_supported_error_code_names:
|
|
print(f'{msg}{data}', flush=True)
|
|
else:
|
|
if isinstance(data, str) and data in error_map.values():
|
|
print(msg, end='')
|
|
else:
|
|
print(msg)
|
|
print(json.dumps(data, sort_keys=False, indent=4), flush=True)
|
|
return
|
|
|
|
@classmethod
|
|
def _print_func_name(self, msg):
|
|
if verbose == 2:
|
|
stk = inspect.stack()
|
|
if stk[2].function == '_callSetUp':
|
|
return
|
|
print(msg, flush=True)
|
|
print(f'{stk[2].function}', flush=True)
|
|
return
|
|
|
|
@classmethod
|
|
def get_error_code(self, e):
|
|
error_code = e.get_error_code()
|
|
return error_map[error_code]
|
|
|
|
@classmethod
|
|
def _check_ret(self, msg, _e, expected_code=None):
|
|
error_code = str(_e.get_error_code())
|
|
error_code_name = error_map[error_code]
|
|
if error_code in not_supported_error_codes:
|
|
if verbose == 2:
|
|
print(f'{msg}\nTest SKIPPED with result {error_code_name}', flush=True)
|
|
elif error_code_name == expected_code:
|
|
if verbose == 2:
|
|
print(f'{msg}\nTest PASSED with expected result {expected_code}', flush=True)
|
|
else:
|
|
if verbose == 2:
|
|
print(f'{msg}\nTest FAILED with expected result {expected_code} but received {error_code_name}', flush=True)
|
|
return True
|
|
return False
|
|
|
|
def setUp(self):
|
|
self._print_func_name('')
|
|
amdsmi.amdsmi_init()
|
|
|
|
def tearDown(self):
|
|
amdsmi.amdsmi_shut_down()
|
|
|
|
|
|
def test_clean_gpu_local_data(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f"gpu({i}): "
|
|
ret = amdsmi.amdsmi_clean_gpu_local_data(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_cpu_apb_disable(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f"gpu({i}): "
|
|
ret = amdsmi.amdsmi_cpu_apb_disable(processors[i], 0)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_cpu_apb_enable(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f"gpu({i}): "
|
|
ret = amdsmi.amdsmi_cpu_apb_enable(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_first_online_core_on_cpu_socket(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_first_online_core_on_cpu_socket as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f"gpu({i}): "
|
|
ret = amdsmi.amdsmi_first_online_core_on_cpu_socket(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_free_name_value_pairs(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_free_name_value_pairs as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
try:
|
|
msg = f""
|
|
rc = amdsmi.amdsmi_free_name_value_pairs(None)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_clk_freq(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_clock_info as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for clk_type_name, clk_type, clk_cond in self.clk_types:
|
|
try:
|
|
msg = f"gpu({i}): Clock Type({clk_type_name}): "
|
|
ret = amdsmi.amdsmi_get_clk_freq(processors[i], clk_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, clk_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_clock_info(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_clock_info as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for clk_type_name, clk_type, clk_cond in self.clk_types:
|
|
try:
|
|
msg = f'gpu({i}): Clock Type({clk_type_name}): '
|
|
ret = amdsmi.amdsmi_get_clock_info(processors[i], clk_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, clk_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_cclk_limit(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_cclk_limit(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_core_boostlimit(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_core_boostlimit(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
self.tearDown()
|
|
if raise_exception:
|
|
raise raise_exception
|
|
|
|
|
|
def test_get_cpu_core_current_freq_limit(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f"gpu({i}): "
|
|
ret = amdsmi.amdsmi_get_cpu_core_current_freq_limit(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_core_energy(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_core_energy as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f"gpu({i}): "
|
|
ret = amdsmi.amdsmi_get_cpu_core_energy(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_current_io_bandwidth(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for encoding_name, encoding, encoding_cond in self.io_bw_encodings:
|
|
try:
|
|
msg = f'gpu({i}): encodeing({encoding_name}): '
|
|
ret = amdsmi.amdsmi_get_cpu_current_io_bandwidth(processors[i], encoding, encoding_name)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, encoding_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_ddr_bw(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_ddr_bw(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_dimm_power_consumption(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_dimm_power_consumption as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO dimm_addr = 0
|
|
dimm_addr = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_dimm_power_consumption(processors[i], dimm_addr)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_dimm_temp_range_and_refresh_rate(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_dimm_temp_range_and_refresh_rate as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO dimm_addr = 0
|
|
dimm_addr = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_dimm_temp_range_and_refresh_rate(processors[i], dimm_addr)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_dimm_thermal_sensor(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_dimm_thermal_sensor as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO dimm_addr = 0
|
|
dimm_addr = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_dimm_thermal_sensor(processors[i], dimm_addr)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_family(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_family as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
try:
|
|
msg = ''
|
|
ret = amdsmi.amdsmi_get_cpu_family()
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_fclk_mclk(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_fclk_mclk(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_handles(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_cpu_handles as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
try:
|
|
msg = ''
|
|
ret = amdsmi.amdsmi_get_cpu_handles(amdsmi.amdsmi_interface.AMDSMI_MAX_DEVICES)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_hsmp_driver_version(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_hsmp_driver_version as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_hsmp_driver_version(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_hsmp_proto_ver(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_hsmp_proto_ver as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_hsmp_proto_ver(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_model(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_model as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
try:
|
|
msg = ''
|
|
ret = amdsmi.amdsmi_get_cpu_model()
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_prochot_status(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_prochot_status(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_pwr_svi_telemetry_all_rails(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_pwr_svi_telemetry_all_rails(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_smu_fw_version(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_smu_fw_version(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_c0_residency(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_c0_residency(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_current_active_freq_limit(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_current_active_freq_limit(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_energy(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_cpu_socket_energy as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_energy(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_freq_range(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_freq_range(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_lclk_dpm_level(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
nbio_id = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): nbio_id({nbio_id}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_lclk_dpm_level(processors[i], nbio_id)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_power(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_power(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_power_cap(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_power_cap(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_power_cap_max(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_power_cap_max(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_cpu_socket_temperature(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_cpu_socket_temperature(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_energy_count(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_energy_count(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_esmi_err_msg(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_esmi_err_msg as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
for status_num in error_map:
|
|
try:
|
|
msg = f'status({error_map[status_num]}): '
|
|
ret = amdsmi.amdsmi_get_esmi_err_msg(error_map[status_num])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_fw_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f"gpu({i}): "
|
|
ret = amdsmi.amdsmi_get_fw_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_accelerator_partition_profile(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_accelerator_partition_profile(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_accelerator_partition_profile_config(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_accelerator_partition_profile_config(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_activity(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_activity(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_asic_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_asic_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_bad_page_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_bad_page_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_bad_page_threshold(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_bad_page_threshold(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_bdf_id(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_bdf_id(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_board_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_board_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_cache_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = gpu_cache_infos = amdsmi.amdsmi_get_gpu_cache_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_compute_partition(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_compute_partition(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_compute_process_gpus(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_gpu_compute_process_gpus as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
# TODO pid = 0
|
|
pid = 0
|
|
try:
|
|
msg = f'pid({pid}): '
|
|
ret = gpu_compute_process_gpuss = amdsmi.amdsmi_get_gpu_compute_process_gpus(pid)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_compute_process_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_compute_process_info()
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_compute_process_info_by_pid(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_gpu_compute_process_info_by_pid as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
# TODO pid = 0
|
|
pid = 0
|
|
try:
|
|
msg = f'pid({pid}): '
|
|
ret = amdsmi.amdsmi_get_gpu_compute_process_info_by_pid(pid)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_device_bdf(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_device_bdf(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_device_uuid(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_device_uuid(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_driver_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_driver_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_ecc_count(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for gpu_block_name, gpu_block, gpu_block_cond in self.gpu_blocks:
|
|
try:
|
|
msg = f'gpu({i}): gpu_block({gpu_block_name}) '
|
|
ret = amdsmi.amdsmi_get_gpu_ecc_count(processors[i], gpu_block)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, gpu_block_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_ecc_enabled(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_ecc_enabled(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_ecc_status(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_gpu_ecc_status as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for gpu_block_name, gpu_block, gpu_block_cond in self.gpu_blocks:
|
|
try:
|
|
msg = f'gpu({i}): gpu_block({gpu_block_name}) '
|
|
ret = amdsmi.amdsmi_get_gpu_ecc_status(processors[i], gpu_block)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, gpu_block_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_enumeration_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_enumeration_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_event_notification(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_gpu_event_notification as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_event_notification(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_fan_rpms(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_fan_rpms(processors[i], 0)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_fan_speed(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_fan_speed(processors[i], 0)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_fan_speed_max(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_fan_speed_max(processors[i], 0)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_id(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_id(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_kfd_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_kfd_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_mem_overdrive_level(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_mem_overdrive_level(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_memory_partition(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_memory_partition(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_memory_partition_config(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_memory_partition_config(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_memory_reserved_pages(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_memory_reserved_pages(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_memory_total(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for memory_type_name, memory_type, memory_type_cond in self.memory_types:
|
|
try:
|
|
msg = f'gpu({i}): memory_type({memory_type_name}) '
|
|
ret = amdsmi.amdsmi_get_gpu_memory_total(processors[i], memory_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, memory_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_memory_usage(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for memory_type_name, memory_type, memory_type_cond in self.memory_types:
|
|
try:
|
|
msg = f'gpu({i}): memory_type({memory_type_name}) '
|
|
ret = amdsmi.amdsmi_get_gpu_memory_usage(processors[i], memory_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, memory_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_metrics_header_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_metrics_header_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_metrics_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_metrics_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_od_volt_curve_regions(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
num_region = 10
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): num_region({num_region}): '
|
|
ret = amdsmi.amdsmi_get_gpu_od_volt_curve_regions(processors[i], num_region)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_od_volt_info(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_gpu_od_volt_info as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_od_volt_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_overdrive_level(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_overdrive_level(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_pci_bandwidth(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_pci_bandwidth(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_pci_replay_counter(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_pci_replay_counter(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_pci_throughput(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_pci_throughput(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_perf_level(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_perf_level(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_pm_metrics_info(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_gpu_pm_metrics_info as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_pm_metrics_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_power_profile_presets(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_power_profile_presets(processors[i], 0)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_process_isolation(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_gpu_process_isolation as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_process_isolation(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_process_list(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_process_list(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_ras_block_features_enabled(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_ras_block_features_enabled(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_ras_feature_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_ras_feature_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_reg_table_info(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_gpu_reg_table_info as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for reg_type_name, reg_type, reg_type_cond in self.reg_types:
|
|
try:
|
|
msg = f'gpu({i}): reg_type({reg_type_name}): '
|
|
ret = amdsmi.amdsmi_get_gpu_reg_table_info(processors[i], reg_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, reg_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_revision(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_gpu_revision as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_revision(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_subsystem_id(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_subsystem_id(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_subsystem_name(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_subsystem_name(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_topo_numa_affinity(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_topo_numa_affinity(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_total_ecc_count(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_total_ecc_count(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_vbios_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_vbios_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_vendor_name(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_vendor_name(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_virtualization_mode(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_virtualization_mode(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_volt_metric(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for voltage_type_name, voltage_type, voltage_type_cond in self.voltage_types:
|
|
for voltage_metric_name, voltage_metric, voltage_metric_cond in self.voltage_metrics:
|
|
try:
|
|
msg = f'gpu({i}): voltage_type({voltage_type_name}) voltage_metric({voltage_metric_name}): '
|
|
ret = amdsmi.amdsmi_get_gpu_volt_metric(processors[i], voltage_type, voltage_metric)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if not voltage_type_cond == self.PASS:
|
|
if self._check_ret(msg, e, voltage_type_cond):
|
|
raise_exception = e
|
|
elif not voltage_metric_cond == self.PASS:
|
|
if self._check_ret(msg, e, voltage_metric_cond):
|
|
raise_exception = e
|
|
else:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_vram_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_vram_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_vram_usage(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_vram_usage(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_vram_vendor(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_vram_vendor(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_xcd_counter(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_xcd_counter(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_xgmi_link_status(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_gpu_xgmi_link_status(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_hsmp_metrics_table(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_hsmp_metrics_table(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_hsmp_metrics_table_version(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_hsmp_metrics_table_version(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_lib_version(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
try:
|
|
msg = f''
|
|
ret = amdsmi.amdsmi_get_lib_version()
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_link_metrics(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_link_metrics as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_link_metrics(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_link_topology_nearest(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for link_type_name, link_type, link_type_cond in self.link_types:
|
|
try:
|
|
msg = f'gpu({i}): link_type({link_type_name}) '
|
|
ret = amdsmi.amdsmi_get_link_topology_nearest(processors[i], link_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, link_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_minmax_bandwidth_between_processors(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_minmax_bandwidth_between_processors as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for j in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i},{j}): '
|
|
ret = amdsmi.amdsmi_get_minmax_bandwidth_between_processors(processors[i], processors[j])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_pcie_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_pcie_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_power_cap_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_power_cap_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_power_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = power_info = amdsmi.amdsmi_get_power_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_processor_count_from_handles(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_processor_count_from_handles as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_processor_count_from_handles(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_processor_handle_from_bdf(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_processor_handle_from_bdf as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
#TODO: define bdf
|
|
bdf = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_processor_handle_from_bdf(bdf)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_processor_handles(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
self._print(f' {i:2d} processor_handles: {processors[i]}')
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_processor_handles_by_type(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_processor_handles_by_type as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_processor_handles_by_type(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_processor_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_processor_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_processor_type(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_processor_type(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_soc_pstate(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_soc_pstate as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_soc_pstate(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_socket_handles(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_socket_handles as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
try:
|
|
msg = f''
|
|
ret = amdsmi.amdsmi_get_socket_handles()
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_socket_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
sockets = amdsmi.amdsmi_get_socket_handles()
|
|
self.assertGreaterEqual(len(sockets), 1)
|
|
# TODO Find maximum number of sockets
|
|
self.assertLessEqual(len(sockets), 32)
|
|
for i in range(0, len(sockets)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_socket_info(sockets[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_temp_metric(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for temperature_type_name, temperature_type, temperature_type_cond in self.temperature_types:
|
|
for temperature_metric_name, temperature_metric, temperature_metric_cond in self.temperature_metrics:
|
|
try:
|
|
msg = f'gpu({i}): temperature_type=({temperature_type_name}) temperature_metric({temperature_metric_name}): '
|
|
ret = amdsmi.amdsmi_get_temp_metric(processors[i], temperature_type, temperature_metric)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if not temperature_type_cond == self.PASS:
|
|
if self._check_ret(msg, e, temperature_type_cond):
|
|
raise_exception = e
|
|
elif not temperature_metric_cond == self.PASS:
|
|
if self._check_ret(msg, e, temperature_metric_cond):
|
|
raise_exception = e
|
|
else:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_threads_per_core(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_threads_per_core as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
# TODO threads_per_core
|
|
try:
|
|
msg = f'threads_per_core: '
|
|
ret = amdsmi.amdsmi_get_threads_per_core()
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_utilization_count(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_utilization_count as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for utilization_counter_type_name, utilization_counter_type, utilization_counter_type_cond in self.utilization_counter_types:
|
|
try:
|
|
msg = f'gpu({i}): utilization_counter_type({utilization_counter_type_name}): '
|
|
ret = amdsmi.amdsmi_get_utilization_count(processors[i], utilization_counter_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, utilization_counter_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_violation_status(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_violation_status(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_xgmi_info(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_xgmi_info(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_xgmi_plpd(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_get_xgmi_plpd as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_get_xgmi_plpd(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_gpu_counter_group_supported(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_gpu_counter_group_supported as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for event_group_name, event_group, event_group_cond in self.event_groups:
|
|
try:
|
|
msg = f'gpu({i}): event_group({event_group_name}): '
|
|
ret = amdsmi.amdsmi_gpu_counter_group_supported(processors[i], event_group)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, event_group_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
if False: # TODO: create_counter, destroy_counter, read_counter, get_gpu_available_counters, gpu_control_counter
|
|
''' Check these:
|
|
test_get_gpu_pci_replay_counter
|
|
test_get_gpu_xcd_counter
|
|
test_gpu_counter_group_supported
|
|
'''
|
|
|
|
|
|
def test_gpu_create_counter(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_gpu_create_counter as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for event_type_name, event_type, event_type_cond in self.event_types:
|
|
try:
|
|
msg = f'gpu({i}): event_type({event_type_name}): '
|
|
ret = amdsmi.amdsmi_gpu_create_counter(processors[i], event_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, event_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_gpu_destroy_counter(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_gpu_destroy_counter as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
# TODO event_handle = 0
|
|
event_handle = 0
|
|
try:
|
|
msg = f'event_handle({event_handle}): '
|
|
ret = event_handle
|
|
amdsmi.amdsmi_gpu_destroy_counter(event_handle)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_gpu_read_counter(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_gpu_read_counter as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO event_handle = 0
|
|
event_handle = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): event_handle({event_handle}): '
|
|
ret = amdsmi.amdsmi_gpu_read_counter(event_handle)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_get_gpu_available_counters(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_get_gpu_available_counters as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for event_group_name, event_group_type, event_group_cond in self.event_groups:
|
|
try:
|
|
msg = f'gpu({i}): event_group({event_group_name}) '
|
|
ret = amdsmi.amdsmi_get_gpu_available_counters(processors[i], event_group_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, event_group_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_gpu_control_counter(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_gpu_control_counter as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
# TODO event_handle = 0
|
|
event_handle = 0
|
|
for counter_command_name, counter_command, counter_commands_cond in self.counter_commands:
|
|
try:
|
|
msg = f'counter_command({counter_command_name}): '
|
|
ret = amdsmi.amdsmi_gpu_control_counter(event_handle, counter_command)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_gpu_validate_ras_eeprom(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_gpu_validate_ras_eeprom as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_gpu_validate_ras_eeprom(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_gpu_xgmi_error_status(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_gpu_xgmi_error_status(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_init(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
try:
|
|
msg = f''
|
|
ret = amdsmi.amdsmi_init()
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_shut_down(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
try:
|
|
msg = f''
|
|
ret = amdsmi.amdsmi_shut_down()
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_init_gpu_event_notification(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_init_gpu_event_notification as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_init_gpu_event_notification(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_is_P2P_accessible(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for j in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i},{j}): '
|
|
ret = amdsmi.amdsmi_is_P2P_accessible(processors[i], processors[j])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_is_gpu_power_management_enabled(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_is_gpu_power_management_enabled(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_reset_gpu(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_reset_gpu(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_reset_gpu_fan(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_reset_gpu_fan(processors[i], 0)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_reset_gpu_xgmi_error(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_reset_gpu_xgmi_error(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_clk_freq(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_clk_freq as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO freq_bitmask = 0
|
|
freq_bitmask = 0
|
|
for i in range(0, len(processors)):
|
|
for clk_type_name, clk_type, clk_cond in self.clk_types:
|
|
try:
|
|
msg = f'gpu({i}): clk_type({clk_type_name}): freq_bitmask({freq_bitmask}): '
|
|
ret = amdsmi.amdsmi_set_clk_freq(processors[i], clk_type, freq_bitmask)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, clk_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_core_boostlimit(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_cpu_core_boostlimit as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO boost_limit = 0
|
|
boost_limit = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): boost_limit({boost_limit}): '
|
|
ret = amdsmi.amdsmi_set_cpu_core_boostlimit(processors[i], boost_limit)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_df_pstate_range(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_cpu_df_pstate_range as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO max_pstate = 0, min_pstate = 0
|
|
max_pstate = 0
|
|
min_pstate = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): max_pstate({max_pstate}) min_pstate({min_pstate}): '
|
|
ret = amdsmi.amdsmi_set_cpu_df_pstate_range(processors[i], max_pstate, min_pstate)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_gmi3_link_width_range(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_cpu_gmi3_link_width_range as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO min_link_width = 0, max_link_width = 0
|
|
min_link_width = 0
|
|
max_link_width = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): min_link_width({min_link_width}) max_link_width({max_link_width}): '
|
|
ret = amdsmi.amdsmi_set_cpu_gmi3_link_width_range(processors[i], min_link_width, max_link_width)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_pcie_link_rate(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_cpu_pcie_link_rate as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO rate_ctrl = 0
|
|
rate_ctrl = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): rate_ctrl({rate_ctrl}): '
|
|
ret = amdsmi.amdsmi_set_cpu_pcie_link_rate(processors[i], rate_ctrl)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_pwr_efficiency_mode(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_set_cpu_pwr_efficiency_mode as it is not implemented is not yet implemented.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO mode = 0
|
|
mode = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): mode({mode}): '
|
|
ret = amdsmi.set_cpu_pwr_efficiency_mode(processors[i], mode)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_socket_boostlimit(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_cpu_socket_boostlimit as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO boost_limit = 0
|
|
boost_limit = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): boost_limit({boost_limit}): '
|
|
ret = amdsmi.amdsmi_set_cpu_socket_boostlimit(processors[i], boost_limit)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_socket_lclk_dpm_level(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_cpu_socket_lclk_dpm_level as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO nbio_id = 0, min_val = 0, max_val = 0
|
|
nbio_id = 0
|
|
min_val = 0
|
|
max_val = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): nbio_id({nbio_id}) min_val({min_val}) max_val({max_val}): '
|
|
ret = amdsmi.amdsmi_set_cpu_socket_lclk_dpm_level(processors[i], nbio_id, min_val, max_val)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_socket_power_cap(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_cpu_socket_power_cap as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO power_cap = 0
|
|
power_cap = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): power_cap({power_cap}): '
|
|
ret = amdsmi.amdsmi_set_cpu_socket_power_cap(processors[i], power_cap)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_cpu_xgmi_width(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_cpu_xgmi_width as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO min_width = 0, max_width = 0
|
|
min_width = 0
|
|
max_width = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): min_width({min_width} max_width({max_width}): )'
|
|
ret = amdsmi.amdsmi_set_cpu_xgmi_width(processors[i], min_width , max_width)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_accelerator_partition_profile(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_accelerator_partition_profile as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO profile_index = 0
|
|
profile_index = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): profile_index({profile_index}): '
|
|
ret = amdsmi.amdsmi_set_gpu_accelerator_partition_profile(processors[i], profile_index)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_clk_limit(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_clk_limit as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO value = 0 is for min and max, need to separate out values
|
|
value = 0
|
|
for i in range(0, len(processors)):
|
|
for clk_type_name, clk_type, clk_cond in self.clk_types:
|
|
for clk_limit_type_name, clk_limit_type, clk_limit_cond in self.clk_limit_types:
|
|
try:
|
|
msg = f'gpu({i}): value({value}) clock_type=({clk_type_name}) clock_limit_type({clk_limit_type_name}): '
|
|
ret = amdsmi.amdsmi_set_gpu_clk_limit(processors[i], clk_type, clk_limit_type, value)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if not clk_cond == self.PASS:
|
|
self._check_ret(msg, e, clk_cond)
|
|
raise_exception = e
|
|
elif not clk_limit_type == self.PASS:
|
|
self._check_ret(msg, e, clk_limit_type)
|
|
raise_exception = e
|
|
else:
|
|
self._check_ret(msg, e, self.PASS)
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_clk_range(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_clk_range as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO min_clk_value = 0 max_clk_value = 0
|
|
min_clk_value = 0
|
|
max_clk_value = 0
|
|
for i in range(0, len(processors)):
|
|
for clk_type_name, clk_type, clk_cond in self.clk_types:
|
|
try:
|
|
msg = f'gpu({i}): min_clk_value({min_clk_value}) max_clk_value({max_clk_value}) clk_type({clk_type_name}): '
|
|
ret = amdsmi.amdsmi_set_gpu_clk_range(processors[i], min_clk_value, max_clk_value, clk_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, clk_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_compute_partition(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_compute_partition as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for compute_partition_type_name, compute_partition_type, compute_partition_type_cond in self.compute_partition_types:
|
|
try:
|
|
msg = f'gpu({i}): compute_partition_type({compute_partition_type_name}): '
|
|
ret = amdsmi.amdsmi_set_gpu_compute_partition(processors[i], compute_partition_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, compute_partition_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_event_notification_mask(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_set_gpu_event_notification_mask as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_set_gpu_event_notification_mask(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_fan_speed(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_fan_speed as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO fan_speed = 0
|
|
fan_speed = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): fan_speed({fan_speed}): '
|
|
ret = amdsmi.amdsmi_set_gpu_fan_speed(processors[i], 0, fan_speed)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_memory_partition(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_memory_partition as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for memory_partition_type_name, memory_partition_type, memory_partition_type_cond in self.memory_partition_types:
|
|
try:
|
|
msg = f'gpu({i}): memory_partition_type({memory_partition_type_name}): '
|
|
ret = amdsmi.amdsmi_set_gpu_memory_partition(processors[i], memory_partition_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, memory_partition_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_memory_partition_mode(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_memory_partition_mode as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for memory_partition_type_name, memory_partition_type, memory_partition_type_cond in self.memory_partition_types:
|
|
try:
|
|
msg = f'gpu({i}): memory_partition_type({memory_partition_type_name}): '
|
|
ret = amdsmi.amdsmi_set_gpu_memory_partition_mode(processors[i], memory_partition_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, memory_partition_type_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_od_clk_info(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_od_clk_info as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO value = 0
|
|
value = 0
|
|
for i in range(0, len(processors)):
|
|
for freq_ind_name, freq_ind, freq_ind_cond in self.freq_inds:
|
|
for clk_type_name, clk_type, clk_cond in self.clk_types:
|
|
try:
|
|
msg = f'gpu({i}): freq_ind({freq_ind_name}) value({value}) clk_type({clk_type_name}): '
|
|
ret = amdsmi.amdsmi_set_gpu_od_clk_info(processors[i], freq_ind, value, clk_type)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if not freq_ind_cond == self.PASS:
|
|
self._check_ret(msg, e, freq_ind_cond)
|
|
raise_exception = e
|
|
elif not clk_cond == self.PASS:
|
|
self._check_ret(msg, e, clk_cond)
|
|
raise_exception = e
|
|
else:
|
|
self._check_ret(msg, e, self.PASS)
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_od_volt_info(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_od_volt_info as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO vpoint = 0 clk_value = 0 volt_value = 0
|
|
vpoint = 0
|
|
clk_value = 0
|
|
volt_value = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): vpoint({vpoint}) clk_value({clk_value}) volt_value({volt_value}): '
|
|
ret = amdsmi.amdsmi_set_gpu_od_volt_info(processors[i], vpoint, clk_value, volt_value)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_overdrive_level(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_overdrive_level as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO overdrive_value = 0
|
|
overdrive_value = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): overdrive_value({overdrive_value}): '
|
|
ret = amdsmi.amdsmi_set_gpu_overdrive_level(processors[i], overdrive_value)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_pci_bandwidth(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_pci_bandwidth as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO bitmask = 0
|
|
bitmask = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): bitmask({bitmask}): '
|
|
ret = amdsmi.amdsmi_set_gpu_pci_bandwidth(processors[i], bitmask)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_perf_determinism_mode(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_perf_determinism_mode as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO clk_value = 0
|
|
clk_value = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): clk_value({clk_value}): '
|
|
ret = amdsmi.amdsmi_set_gpu_perf_determinism_mode(processors[i], clk_value)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_perf_level(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_perf_level as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO Need to set back to default
|
|
for i in range(0, len(processors)):
|
|
for dev_perf_level_name, dev_perf_level, dev_perf_level_cond in self.dev_perf_levels:
|
|
try:
|
|
msg = f'gpu({i}): dev_perf_level({dev_perf_level_name}): '
|
|
ret = amdsmi.amdsmi_set_gpu_perf_level(processors[i], dev_perf_level)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, dev_perf_level_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_power_profile(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_gpu_power_profile as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for power_profile_preset_mask, power_profile_preset_masks_cond in self.power_profile_preset_masks:
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_set_gpu_power_profile(processors[i], 0, power_profile_preset_mask)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, power_profile_preset_masks_cond):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_gpu_process_isolation(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_set_gpu_process_isolation as it is not yet implemented.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO pisolate = 0
|
|
pisolate = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_set_gpu_process_isolation(processors[i], pisolate)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_power_cap(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_power_cap as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO cap = 0
|
|
cap = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_set_power_cap(processors[i], 0, cap)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_soc_pstate(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_soc_pstate as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO policy_id = 0
|
|
policy_id = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_set_soc_pstate(processors[i], policy_id)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_set_xgmi_plpd(self):
|
|
if self.TODO_SKIP_NOT_COMPLETE:
|
|
self.skipTest("Skipping test_set_xgmi_plpd as it is not complete.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
# TODO policy_id = 0
|
|
policy_id = 0
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_set_xgmi_plpd(processors[i], policy_id)
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_status_code_to_string(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_status_code_to_string as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
# TODO status = 0
|
|
status = 0
|
|
status_code_to_string = amdsmi.amdsmi_status_code_to_string(status)
|
|
self._print(f' {status} status_code_to_string: {status_code_to_string}')
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_stop_gpu_event_notification(self):
|
|
if self.TODO_SKIP_NYI:
|
|
self.skipTest("Skipping test_stop_gpu_event_notification as it is not implemented yet.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_stop_gpu_event_notification(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_topo_get_link_type(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for j in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i},{j}): '
|
|
ret = amdsmi.amdsmi_topo_get_link_type(processors[i], processors[j])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_topo_get_link_weight(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for j in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i},{j}): '
|
|
ret = amdsmi.amdsmi_topo_get_link_weight(processors[i], processors[j])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_topo_get_numa_node_number(self):
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i}): '
|
|
ret = amdsmi.amdsmi_topo_get_numa_node_number(processors[i])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
|
|
def test_topo_get_p2p_status(self):
|
|
if self.TODO_SKIP_FAIL:
|
|
self.skipTest("Skipping test_topo_get_p2p_status as it fails.")
|
|
raise_exception = None
|
|
self.setUp()
|
|
processors = amdsmi.amdsmi_get_processor_handles()
|
|
self.assertGreaterEqual(len(processors), 1)
|
|
self.assertLessEqual(len(processors), 32)
|
|
for i in range(0, len(processors)):
|
|
for j in range(0, len(processors)):
|
|
try:
|
|
msg = f'gpu({i},{j}): '
|
|
ret = amdsmi.amdsmi_topo_get_p2p_status(processors[i], processors[j])
|
|
self._print(msg, ret)
|
|
except amdsmi.AmdSmiLibraryException as e:
|
|
if self._check_ret(msg, e, self.PASS):
|
|
raise_exception = e
|
|
if raise_exception:
|
|
raise raise_exception
|
|
self.tearDown()
|
|
|
|
if __name__ == '__main__':
|
|
verbose=1
|
|
if '-q' in sys.argv or '--quiet' in sys.argv:
|
|
verbose=0
|
|
elif '-v' in sys.argv or '--verbose' in sys.argv:
|
|
verbose=2
|
|
|
|
unittest.main()
|