From fc003e8db5ca6752d8b53249eaa2cd5b1d3a4b4d Mon Sep 17 00:00:00 2001 From: foreman Date: Thu, 19 Dec 2019 12:20:17 -0500 Subject: [PATCH] P4 to Git Change 2048585 by kjayapra@2_HIPWS_P2P_ROCM2 on 2019/12/19 12:15:48 SWDEV-215976 - Map IPC pointers to all devices by default, since Peer is enabled @ roc::init anyway. Affected files ... ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdevice.cpp#147 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdevice.hpp#46 edit --- rocclr/runtime/device/rocm/rocdevice.cpp | 12 +++++++++++- rocclr/runtime/device/rocm/rocdevice.hpp | 1 + 2 files changed, 12 insertions(+), 1 deletion(-) diff --git a/rocclr/runtime/device/rocm/rocdevice.cpp b/rocclr/runtime/device/rocm/rocdevice.cpp index dce32bce70..2cc53cd4b8 100644 --- a/rocclr/runtime/device/rocm/rocdevice.cpp +++ b/rocclr/runtime/device/rocm/rocdevice.cpp @@ -216,6 +216,8 @@ Device::~Device() { delete settings_; settings_ = nullptr; } + + delete[] p2p_agents_list_; } bool NullDevice::initCompiler(bool isOffline) { #if defined(WITH_COMPILER_LIB) @@ -1074,6 +1076,13 @@ bool Device::populateOCLDeviceConstants() { } } + /* Keep track of all P2P Agents in a Array including current device handle for IPC */ + p2p_agents_list_ = new hsa_agent_t[1 + p2p_agents_.size()]; + p2p_agents_list_[0] = getBackendDevice(); + for (size_t agent_idx = 0; agent_idx < p2p_agents_.size(); ++agent_idx) { + p2p_agents_list_[1 + agent_idx] = p2p_agents_[agent_idx]; + } + size_t group_segment_size = 0; if (HSA_STATUS_SUCCESS != hsa_amd_memory_pool_get_info(group_segment_, HSA_AMD_MEMORY_POOL_INFO_SIZE, @@ -1718,11 +1727,12 @@ amd::Memory *Device::IpcAttach(const void* handle, size_t mem_size, unsigned int amd::Memory* amd_mem_obj = nullptr; hsa_status_t hsa_status = HSA_STATUS_SUCCESS; + /* FIX_ME (SWDEV-215976): Mapping for all devices is not optimal. In future map only for devices on need basis */ /* Retrieve the devPtr from the handle */ hsa_agent_t hsa_agent = getBackendDevice(); hsa_status = hsa_amd_ipc_memory_attach(reinterpret_cast(handle), - mem_size, 1, &hsa_agent, dev_ptr); + mem_size, (1 + p2p_agents_.size()), p2p_agents_list_, dev_ptr); if (hsa_status != HSA_STATUS_SUCCESS) { LogError("[OCL] HSA failed to attach IPC memory"); diff --git a/rocclr/runtime/device/rocm/rocdevice.hpp b/rocclr/runtime/device/rocm/rocdevice.hpp index 4fe0eea6d1..b257e1cf6d 100644 --- a/rocclr/runtime/device/rocm/rocdevice.hpp +++ b/rocclr/runtime/device/rocm/rocdevice.hpp @@ -439,6 +439,7 @@ class Device : public NullDevice { static std::vector gpu_agents_; std::vector p2p_agents_; //!< List of P2P agents available for this device hsa_agent_t _bkendDevice; + hsa_agent_t* p2p_agents_list_; hsa_profile_t agent_profile_; hsa_amd_memory_pool_t group_segment_; hsa_amd_memory_pool_t system_segment_;