[SWDEV-573540] Add DRM-based wake for suspended AMD GPUs (#2510)

Implements automatic device wake using getDRMDeviceId() DRM call when GPUs
are detected in low-power state. This ensures rocm-smi can access device
information on suspended GPUs.

Signed-off-by: Bindhiya Kanangot Balakrishnan <Bindhiya.KanangotBalakrishnan@amd.com>
This commit is contained in:
Bindhiya Kanangot Balakrishnan
2026-01-08 10:19:45 -06:00
zatwierdzone przez GitHub
rodzic ac1fa8dccb
commit 8326c33d33
@@ -4518,7 +4518,19 @@ if __name__ == '__main__':
if not checkAmdGpus(deviceList):
logging.warning('No AMD GPUs specified')
if not check_runtime_status():
logging.warning('AMD GPU device(s) is/are in a low-power state. Check power control/runtime_status\n')
wake_device_failed = False
logging.debug('Using DRM device ID call to wake suspended devices')
for device in deviceList:
try:
device_id = getDRMDeviceId(device, silent=True)
if device_id == 'N/A':
wake_device_failed = True
logging.debug(f'Failed to wake device {device} via DRM call')
except Exception as e:
wake_device_failed = True
logging.debug(f'Exception waking device {device}: {str(e)}')
if wake_device_failed:
logging.warning('AMD GPU device(s) is/are in a low-power state. Check power control/runtime_status\n')
if isConciseInfoRequested(args):
showAllConcise(deviceList)
if args.showhw: