Files
rocm-systems/runtime/hsa-runtime/core/inc/driver.h
T
Honglei Huang 6c87f5b5ce rocr/driver: add memory residency management interface in driver
This commit introduces MakeMemoryResident and MakeMemoryUnresident
functions to KfdDriver and XdnaDriver classes.

- Added implementations in amd_kfd_driver.cpp
- Added stubs in amd_xdna_driver.cpp returning HSA_STATUS_ERROR
- Updated header files amd_kfd_driver.h and amd_xdna_driver.h
- Removed MakeKfdMemoryResident/Unresident from amd_memory_region.cpp

Signed-off-by: Honglei Huang <Honglei1.Huang@amd.com>
2025-07-16 13:15:45 +08:00

362 خطوط
17 KiB
C++

////////////////////////////////////////////////////////////////////////////////
//
// The University of Illinois/NCSA
// Open Source License (NCSA)
//
// Copyright (c) 2023-2025, Advanced Micro Devices, Inc. All rights reserved.
//
// Developed by:
//
// AMD Research and AMD HSA Software Development
//
// Advanced Micro Devices, Inc.
//
// www.amd.com
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to
// deal with the Software without restriction, including without limitation
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
// and/or sell copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following conditions:
//
// - Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimers.
// - Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimers in
// the documentation and/or other materials provided with the distribution.
// - Neither the names of Advanced Micro Devices, Inc,
// nor the names of its contributors may be used to endorse or promote
// products derived from this Software without specific prior written
// permission.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
// DEALINGS WITH THE SOFTWARE.
//
////////////////////////////////////////////////////////////////////////////////
#ifndef HSA_RUNTME_CORE_INC_DRIVER_H_
#define HSA_RUNTME_CORE_INC_DRIVER_H_
#include <cstdint>
#include <limits>
#include <string>
#include "core/inc/memory_region.h"
#include "hsakmt/hsakmttypes.h"
#include "inc/hsa.h"
namespace rocr {
namespace core {
class Queue;
enum class DriverQuery { GET_DRIVER_VERSION };
enum class DriverType { XDNA = 0, KFD, NUM_DRIVER_TYPES };
/// @brief Handle for exported / imported memory.
struct ShareableHandle {
uint64_t handle{};
bool IsValid() const { return handle != 0; }
};
/// @brief Kernel driver interface.
///
/// @details A class used to provide an interface between the core runtime
/// and agent kernel drivers. It also maintains state associated with active
/// kernel drivers.
class Driver {
public:
Driver(DriverType kernel_driver_type, std::string devnode_name);
virtual ~Driver() = default;
/// @brief Initialize the driver's state after opening.
virtual hsa_status_t Init() = 0;
/// @brief Release the driver's resources and close the kernel-mode
/// driver.
virtual hsa_status_t ShutDown() = 0;
/// @brief Get driver version information.
/// @retval DriverVersionInfo containing the driver's version information.
const HsaVersionInfo& Version() const { return version_; }
/// @brief Query the kernel-model driver.
/// @retval HSA_STATUS_SUCCESS if the kernel-model driver query was
/// successful.
virtual hsa_status_t QueryKernelModeDriver(DriverQuery query) = 0;
/// @brief Open a connection to the driver using name_.
/// @retval HSA_STATUS_SUCCESS if the driver was opened successfully.
virtual hsa_status_t Open() = 0;
/// @brief Close a connection to the open driver using fd_.
/// @retval HSA_STATUS_SUCCESS if the driver was opened successfully.
virtual hsa_status_t Close() = 0;
/// @brief Get the system properties for nodes managed by this driver.
virtual hsa_status_t GetSystemProperties(HsaSystemProperties& sys_props) const = 0;
/// @brief Get the properties for a specific node managed by this driver.
virtual hsa_status_t GetNodeProperties(HsaNodeProperties& node_props, uint32_t node_id) const = 0;
/// @brief Get the edge (IO link) properties of a specific node (that is
/// managed by this driver) in the topology graph.
/// @param[out] io_link_props IO link properties of the node specified by @p node_id.
/// @param[in] node_id ID of the node whose link properties are being queried.
virtual hsa_status_t GetEdgeProperties(std::vector<HsaIoLinkProperties>& io_link_props,
uint32_t node_id) const = 0;
/// @brief Get the memory properties of a specific node.
/// @param[in] node_id Node ID of the agent.
/// @param[out] mem_props Memory properties of the node specified by @p node_id.
/// @retval HSA_STATUS_SUCCESS if the driver sucessfully returns the node's
/// memory properties.
virtual hsa_status_t GetMemoryProperties(uint32_t node_id,
std::vector<HsaMemoryProperties>& mem_props) const = 0;
/// @brief Get the cache properties of a specific node.
/// @param[in] node_ide Node ID of the agent.
/// @param[out] cache_props Cache properties of the node specified by @p node_id.
/// @retval HSA_STATUS_SUCCESS if the driver successfully returns the node's cache properties.
virtual hsa_status_t GetCacheProperties(uint32_t node_id, uint32_t processor_id,
std::vector<HsaCacheProperties>& cache_props) const = 0;
/// @brief Allocate agent-accessible memory (system or agent-local memory).
/// @param[out] mem pointer to newly allocated memory.
/// @retval HSA_STATUS_SUCCESS if memory was successfully allocated or
/// hsa_status_t error code if the memory allocation failed.
virtual hsa_status_t AllocateMemory(const MemoryRegion &mem_region,
MemoryRegion::AllocateFlags alloc_flags,
void **mem, size_t size,
uint32_t node_id) = 0;
virtual hsa_status_t FreeMemory(void *mem, size_t size) = 0;
/// @brief Create an agent dispatch queue with user-mode access rights.
/// @param[in] node_id Node ID of the agent on which the queue is being created.
/// @param[in] type Queue's type.
/// @param[in] queue_pct Maximum percentage of a queue's occupancy allowed.
/// @param[in] priority Queue's priority for scheduling.
/// @param[in] sdma_engine_id ID of the SDMA engine on which the queue is being created. Only used
/// if @p type is one of the SDMA queue types.
/// @param[in] queue_addr Address of the queue's ring buffer.
/// @param[in] queue_size_bytes Size of the queue's ring buffer in bytes.
/// @param[in] event HsaEvent for event-driven callbacks.
/// @param[out] queue_resource Queue resource information populated by the driver.
virtual hsa_status_t CreateQueue(uint32_t node_id, HSA_QUEUE_TYPE type, uint32_t queue_pct,
HSA_QUEUE_PRIORITY priority, uint32_t sdma_engine_id,
void* queue_addr, uint64_t queue_size_bytes, HsaEvent* event,
HsaQueueResource& queue_resource) const = 0;
/// @brief Destroy a queue.
/// @param queue_id Kernel-mode driver's assigned queue ID.
virtual hsa_status_t DestroyQueue(HSA_QUEUEID queue_id) const = 0;
/// @brief Update a queue's properties.
/// @param[in] queue_id Kernel-mode driver's assigned queue ID.
/// @param[in] queue_pct Maximum percentage of a queue's occupancy allowed.
/// @param[in] priority Queue's priority for scheduling.
/// @param[in] queue_addr Queue's ring buffer base address.
/// @param[in] queue_size_bytes Size of the queue's ring buffer in bytes.
/// @param[in] event HsaEvent for event-driven callbacks.
virtual hsa_status_t UpdateQueue(HSA_QUEUEID queue_id, uint32_t queue_pct,
HSA_QUEUE_PRIORITY priority, void* queue_addr,
uint64_t queue_size_bytes, HsaEvent* event) const = 0;
/// @brief Set the CU mask for a queue.
/// @details This sets the CU bitmask for a queue. The CU mask determines which CUs
/// a queue's dispatches can target. Currently this is only supported for GPU devices.
/// @param[in] queue_id Kernel-mode driver's assigned queue ID.
/// @param[in] cu_mask_count Number of CU bits in the mask.
/// @param[in] queue_cu_mask New CU mask for the queue.
virtual hsa_status_t SetQueueCUMask(HSA_QUEUEID queue_id, uint32_t cu_mask_count,
uint32_t* queue_cu_mask) const = 0;
/// @brief Allocate global wave sync (GWS) resource for a queue. This is only supported for GPUs.
/// GWS can be used to synchronize wavefronts across the entire GPU device.
/// @param[in] queue_id Kernel-mode driver's assigned queue ID.
/// @param[in] num_gws Number of GWS slots.
/// @param[in] first_gws First GWS slot.
virtual hsa_status_t AllocQueueGWS(HSA_QUEUEID queue_id, uint32_t num_gws,
uint32_t* first_gws) const = 0;
/// @brief Imports memory using dma-buf.
///
/// @param[in] mem virtual address
/// @param[in] size memory size in bytes
/// @param[out] dmabuf_fd dma-buf file descriptor
/// @param[out] offset memory offset in bytes
virtual hsa_status_t ExportDMABuf(void *mem, size_t size, int *dmabuf_fd,
size_t *offset) = 0;
/// @brief Imports a memory chunk via dma-buf.
///
/// @param[in] dmabuf_fd dma-buf file descriptor
/// @param[in] agent agent to import the memory for
/// @param[out] handle handle to the imported memory
virtual hsa_status_t ImportDMABuf(int dmabuf_fd, core::Agent &agent,
core::ShareableHandle &handle) = 0;
/// @brief Maps the memory associated with the handle.
///
/// @param[in] handle handle to the memory object
/// @param[in] mem virtual address associated with the handle
/// @param[in] offset memory offset in bytes
/// @param[in] size memory size in bytes
/// @param[out] perms new permissions
virtual hsa_status_t Map(core::ShareableHandle handle, void *mem,
size_t offset, size_t size,
hsa_access_permission_t perms) = 0;
/// @brief Unmaps the memory associated with the handle.
///
/// @param[in] handle handle to the memory object
/// @param[in] mem virtual address associated with the handle
/// @param[in] offset memory offset in bytes
/// @param[in] size memory size in bytes
virtual hsa_status_t Unmap(core::ShareableHandle handle, void *mem,
size_t offset, size_t size) = 0;
/// @brief Releases the object associated with the handle.
///
/// @param[in] handle handle of the object to release
virtual hsa_status_t
ReleaseShareableHandle(core::ShareableHandle &handle) = 0;
/// @brief Acquire a streaming performance monitor on an agent.
/// @param[in] preferred_node_id Node ID of the preferred agent.
virtual hsa_status_t SPMAcquire(uint32_t preferred_node_id) const = 0;
/// @brief Release a streaming performance monitor on an agent.
/// @param[in] preferred_node_id Node ID of the preferred agent.
virtual hsa_status_t SPMRelease(uint32_t preferred_node_id) const = 0;
/// @brief Setup the destination user-mode buffer for streaming performance monitor data.
/// @param[in] preferred_node_id Node ID of the preferred agent.
/// @param[in] size_bytes Size of the destination buffer in bytes.
/// @param[in, out] timeout Timeout in milliseconds.
/// @param[out] size_copied Size of data copied in bytes.
/// @param[in] dest_mem_addr Destination address for streaming performance data. Set to NULL to
/// stop copy on previous buffer.
/// @param[out] is_spm_data_loss Data was lost if true.
virtual hsa_status_t SPMSetDestBuffer(uint32_t preferred_node_id, uint32_t size_bytes,
uint32_t* timeout, uint32_t* size_copied,
void* dest_mem_addr, bool* is_spm_data_loss) const = 0;
/// @brief Open anonymous file descriptor to enable events and read SMI events.
/// @param[in] node_id Node ID to receive the SMI event from.
/// @param[out] fd Anonymous file descriptor.
/// @retval HSA_STATUS_ERROR_INVALID_AGENT if the agent's driver doesn't support
/// SMI events.
virtual hsa_status_t OpenSMI(uint32_t node_id, int* fd) const {
return HSA_STATUS_ERROR_INVALID_AGENT;
}
/// @brief Sets trap handler and trap buffer to be used for all queues associated
/// with the specified NodeId within this process context
/// @param[in] node_id Node ID of the agent
/// @param[in] base Trap handler base address
/// @param[in] base_size Trap handler base size
/// @param[in] buffer_base Trap buffer base address
/// @param[in] buffer_base_size Trap buffer size
/// @return HSA_STATUS_SUCCESS if the driver successfully sets the trap handler.
virtual hsa_status_t SetTrapHandler(uint32_t node_id, const void* base, uint64_t base_size,
const void* buffer_base, uint64_t buffer_base_size) const = 0;
/// @brief Gets the device handle for a specific node.
/// @param node_id Node ID of the agent
/// @param device_handle Device handle
/// @return HSA_STATUS_SUCCESS if the driver successfully returns the device
virtual hsa_status_t GetDeviceHandle(uint32_t node_id, void** device_handle) const = 0;
/// @brief Gets clock counters for particular Node
/// @param[in] node_id Node ID of the agent
/// @param[out] clock_counter Clock counter
/// @return HSA_STATUS_SUCCESS if the driver successfully returns the clock
virtual hsa_status_t GetClockCounters(uint32_t node_id,
HsaClockCounters* clock_counter) const = 0;
/// @brief Get the tile configuration for a specific node.
///
/// @param[in] node_id Node ID of the agent
/// @param[out] config Pointer to tile configuration
/// @return HSA_STATUS_SUCCESS if the driver successfully returns the tile configuration.
virtual hsa_status_t GetTileConfig(uint32_t node_id, HsaGpuTileConfig* config) const = 0;
/// @brief Check if the HSA KMT Model is enabled
/// @param[out] enable True if the model is enabled, false otherwise
virtual hsa_status_t IsModelEnabled(bool* enable) const = 0;
/// @brief Gets the wallclock frequency for a specific node.
/// @param[in] node_id Node ID of the agent
/// @param[out] frequency Pointer to the wallclock frequency
/// @return HSA_STATUS_SUCCESS if the wallclock frequency was successfully retrieved, or an error
/// code.
virtual hsa_status_t GetWallclockFrequency(uint32_t node_id, uint64_t* frequency) const = 0;
/// @brief Allocates scratch memory for the agent.
/// @param[in] node_id Node ID of the agent
/// @param[in] size Size of the scratch memory
/// @param[out] mem Pointer to the scratch memory
/// @return HSA_STATUS_SUCCESS if scratch memory allocated successfully.
virtual hsa_status_t AllocateScratchMemory(uint32_t node_id, uint64_t size, void** mem) const = 0;
/// @brief Inquires memory available for allocation as a memory buffer
/// @param[in] node_id Node ID of the agent
/// @param[out] available_size Available memory size in bytes
/// @return HSA_STATUS_SUCCESS if the driver successfully returns the available memory size.
virtual hsa_status_t AvailableMemory(uint32_t node_id, uint64_t* available_size) const = 0;
/// @brief Register memory to GPU
/// @param[in] ptr Address of memory to be registered
/// @param[in] size Size of memory
/// @param[in] mem_flags Flags of memory registering
/// @return HSA_STATUS_SUCCESS if memory registered successfully.
virtual hsa_status_t RegisterMemory(void* ptr, uint64_t size, HsaMemFlags mem_flags) const = 0;
/// @brief Unregisters with a memory
/// @param[in] ptr Pointer of memory
/// @return HSA_STATUS_SUCCESS if deregister memory successfully.
virtual hsa_status_t DeregisterMemory(void* ptr) const = 0;
/// @brief Make the memory is resident and can be accessed by GPU
/// @param[in] mem address of memory to be made resident
/// @param[in] size size of memory
/// @param[out] alternate_va alternate virtual address
/// @param[in] mem_flags memory flags can be null
/// @param[in] num_nodes number of nodes to be used can be 0 if not used
/// @param[in] nodes nodes to be used can be null
/// @return HSA_STATUS_SUCCESS if the driver successfully makes the memory
virtual hsa_status_t MakeMemoryResident(const void* mem, size_t size, uint64_t* alternate_va,
const HsaMemMapFlags* mem_flags = nullptr,
uint32_t num_nodes = 0,
const uint32_t* nodes = nullptr) const = 0;
/// @brief Releases the residency of the memory
/// @param[in] mem address of memory to be made unresident
/// @return HSA_STATUS_SUCCESS if the driver successfully makes the memory
virtual hsa_status_t MakeMemoryUnresident(const void* mem) const = 0;
/// Unique identifier for supported kernel-mode drivers.
const DriverType kernel_driver_type_;
protected:
HsaVersionInfo version_{std::numeric_limits<uint32_t>::max(),
std::numeric_limits<uint32_t>::max()};
const std::string devnode_name_;
int fd_ = -1;
};
} // namespace core
} // namespace rocr
#endif // header guard