8b529e7b29
In order for pre-commit to be useful, everything needs to meet a common baseline. Signed-off-by: Mario Limonciello (AMD) <superm1@kernel.org>
523 wiersze
18 KiB
C++
523 wiersze
18 KiB
C++
/*
|
|
* Copyright © Advanced Micro Devices, Inc., or its affiliates.
|
|
*
|
|
* SPDX-License-Identifier: MIT
|
|
*/
|
|
|
|
#include "hsa_test.h"
|
|
|
|
#include <atomic>
|
|
#include <iostream>
|
|
|
|
#define PRINT_ATTRIBUTE(attribute, value, metric) \
|
|
std::cout << #attribute " = " << value << " " << metric << std::endl;
|
|
|
|
static size_t ToMB(size_t size) { return (size / (1024 * 1024)); }
|
|
|
|
HsaTest::HsaTest(const char* test_name) : test_name_(test_name) {
|
|
std::cout << "Running " << test_name_ << std::endl;
|
|
std::cout << "------------------------------------------------\n";
|
|
}
|
|
|
|
HsaTest::~HsaTest() {}
|
|
|
|
void HsaTest::Init() {
|
|
hsa_status_t stat = hsa_init();
|
|
if (stat != HSA_STATUS_SUCCESS) {
|
|
std::cerr << "hsa_init fail with status " << stat << std::endl;
|
|
}
|
|
|
|
stat = hsa_iterate_agents(IterateAgents, (void*)this);
|
|
}
|
|
|
|
void HsaTest::Cleanup() { hsa_shut_down(); }
|
|
|
|
hsa_status_t HsaTest::IterateAgents(hsa_agent_t agent, void* data) {
|
|
HsaTest* hsatest = (HsaTest*)data;
|
|
|
|
AgentProps prop(agent);
|
|
|
|
if (prop.device_type == HSA_DEVICE_TYPE_CPU) {
|
|
hsatest->cpus_.push_back(agent);
|
|
} else if (prop.device_type == HSA_DEVICE_TYPE_GPU) {
|
|
hsatest->gpus_.push_back(agent);
|
|
}
|
|
|
|
hsa_amd_memory_pool_t pools[3] = {{0}, {0}, {0}};
|
|
hsa_status_t stat =
|
|
hsa_amd_agent_iterate_memory_pools(agent, IteratePools, pools);
|
|
|
|
hsatest->global_fine_[agent.handle] = pools[0];
|
|
hsatest->global_coarse_[agent.handle] = pools[1];
|
|
hsatest->group_[agent.handle] = pools[2];
|
|
|
|
return HSA_STATUS_SUCCESS;
|
|
}
|
|
|
|
hsa_status_t HsaTest::IteratePools(hsa_amd_memory_pool_t pool, void* data) {
|
|
hsa_amd_memory_pool_t* pools = (hsa_amd_memory_pool_t*)data;
|
|
|
|
PoolProps prop(pool);
|
|
|
|
if (prop.segment == HSA_AMD_SEGMENT_GLOBAL) {
|
|
if (prop.global_flag & HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_FINE_GRAINED) {
|
|
pools[0].handle = pool.handle;
|
|
} else {
|
|
pools[1].handle = pool.handle;
|
|
}
|
|
} else if (prop.segment == HSA_AMD_SEGMENT_GROUP) {
|
|
pools[2].handle = pool.handle;
|
|
}
|
|
|
|
return HSA_STATUS_SUCCESS;
|
|
}
|
|
|
|
HsaTest::AgentProps::AgentProps(hsa_agent_t agent) {
|
|
if (agent.handle == 0) {
|
|
return;
|
|
}
|
|
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_NAME, (void*)name);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_VENDOR_NAME, (void*)vendor_name);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_FEATURE, (void*)&feature);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_MACHINE_MODEL,
|
|
(void*)&machine_model);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_PROFILE, (void*)&profile);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_DEFAULT_FLOAT_ROUNDING_MODE,
|
|
(void*)&default_float_rounding_mode);
|
|
hsa_agent_get_info(agent,
|
|
HSA_AGENT_INFO_BASE_PROFILE_DEFAULT_FLOAT_ROUNDING_MODES,
|
|
(void*)&base_profile_float_rounding_mode);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_FAST_F16_OPERATION,
|
|
(void*)&fast_f16_operation);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_WAVEFRONT_SIZE,
|
|
(void*)&wavefront_size);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_WORKGROUP_MAX_DIM,
|
|
(void*)workgroup_max_dim);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_WORKGROUP_MAX_SIZE,
|
|
(void*)&workgroup_max_size);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_GRID_MAX_DIM, (void*)&grid_max_dim);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_GRID_MAX_SIZE,
|
|
(void*)&grid_max_size);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_FBARRIER_MAX_SIZE,
|
|
(void*)&fbarrier_max_size);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_QUEUES_MAX, (void*)&queue_max);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_QUEUE_MIN_SIZE,
|
|
(void*)&queue_min_size);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_QUEUE_MAX_SIZE,
|
|
(void*)&queue_max_size);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_QUEUE_TYPE, (void*)&queue_type);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_NODE, (void*)&node);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_DEVICE, (void*)&device_type);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_CACHE_SIZE, (void*)cache_size);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_ISA, (void*)&isa);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_EXTENSIONS, (void*)extensions);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_VERSION_MAJOR,
|
|
(void*)&version_major);
|
|
hsa_agent_get_info(agent, HSA_AGENT_INFO_VERSION_MINOR,
|
|
(void*)&version_minor);
|
|
}
|
|
|
|
HsaTest::PoolProps::PoolProps(hsa_amd_memory_pool_t pool) {
|
|
if (pool.handle == 0) {
|
|
return;
|
|
}
|
|
|
|
hsa_amd_memory_pool_get_info(pool, HSA_AMD_MEMORY_POOL_INFO_SEGMENT,
|
|
(void*)&segment);
|
|
hsa_amd_memory_pool_get_info(pool, HSA_AMD_MEMORY_POOL_INFO_GLOBAL_FLAGS,
|
|
(void*)&global_flag);
|
|
hsa_amd_memory_pool_get_info(pool, HSA_AMD_MEMORY_POOL_INFO_SIZE,
|
|
(void*)&size);
|
|
hsa_amd_memory_pool_get_info(pool,
|
|
HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED,
|
|
(void*)&alloc_allowed);
|
|
hsa_amd_memory_pool_get_info(pool,
|
|
HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_GRANULE,
|
|
(void*)&alloc_granule);
|
|
hsa_amd_memory_pool_get_info(pool,
|
|
HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALIGNMENT,
|
|
(void*)&alloc_alignment);
|
|
hsa_amd_memory_pool_get_info(pool, HSA_AMD_MEMORY_POOL_INFO_ACCESSIBLE_BY_ALL,
|
|
(void*)&all_accessible);
|
|
}
|
|
|
|
HsaTest::Kernel::Kernel(hsa_agent_t agent, std::string hsail_text)
|
|
: agent_(agent), hsail_file_(hsail_text) {
|
|
program_.handle = 0;
|
|
code_object_.handle = 0;
|
|
executable_.handle = 0;
|
|
|
|
AgentProps prop(agent_);
|
|
profile_ = prop.profile;
|
|
|
|
Initialize();
|
|
}
|
|
|
|
HsaTest::Kernel::~Kernel() { Cleanup(); }
|
|
|
|
uint64_t HsaTest::Kernel::GetCodeHandle(const char* kernel_name) {
|
|
kernel_symbol_ = {0};
|
|
if (HSA_STATUS_SUCCESS != hsa_executable_get_symbol(executable_, NULL,
|
|
kernel_name, agent_, 0,
|
|
&kernel_symbol_)) {
|
|
return 0;
|
|
}
|
|
|
|
uint64_t code_handle = 0;
|
|
if (HSA_STATUS_SUCCESS !=
|
|
hsa_executable_symbol_get_info(kernel_symbol_,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_OBJECT,
|
|
&code_handle)) {
|
|
return 0;
|
|
}
|
|
|
|
return code_handle;
|
|
}
|
|
|
|
hsa_status_t HsaTest::Kernel::GetScratchSize(uint32_t* size) {
|
|
|
|
hsa_status_t status;
|
|
status = hsa_executable_symbol_get_info(kernel_symbol_,
|
|
HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_PRIVATE_SEGMENT_SIZE, size);
|
|
return status;
|
|
}
|
|
|
|
void HsaTest::Kernel::Initialize() {
|
|
CreateProgramFromHsailFile();
|
|
CreateCodeObjectAndExecutable();
|
|
}
|
|
|
|
void HsaTest::Kernel::Cleanup() {
|
|
if (executable_.handle != 0) {
|
|
hsa_executable_destroy(executable_);
|
|
executable_.handle = 0;
|
|
}
|
|
|
|
if (code_object_.handle != 0) {
|
|
hsa_code_object_destroy(code_object_);
|
|
code_object_.handle = 0;
|
|
}
|
|
|
|
if (program_.handle != 0) {
|
|
hsa_ext_program_destroy(program_);
|
|
program_.handle = 0;
|
|
}
|
|
}
|
|
|
|
bool HsaTest::Kernel::CreateProgramFromHsailFile() {
|
|
if (HSA_STATUS_SUCCESS !=
|
|
hsa_ext_program_create(HSA_MACHINE_MODEL_LARGE, profile_,
|
|
HSA_DEFAULT_FLOAT_ROUNDING_MODE_ZERO, NULL,
|
|
&program_)) {
|
|
return false;
|
|
}
|
|
|
|
if (!tool_.assembleFromFile(hsail_file_.c_str())) {
|
|
return false;
|
|
}
|
|
|
|
hsa_ext_module_t module = tool_.brigModule();
|
|
if (HSA_STATUS_SUCCESS != hsa_ext_program_add_module(program_, module)) {
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
bool HsaTest::Kernel::CreateCodeObjectAndExecutable() {
|
|
hsa_isa_t isa = {0};
|
|
if (HSA_STATUS_SUCCESS !=
|
|
hsa_agent_get_info(agent_, HSA_AGENT_INFO_ISA, &isa)) {
|
|
return false;
|
|
}
|
|
|
|
hsa_ext_control_directives_t control_directives = {0};
|
|
if (HSA_STATUS_SUCCESS !=
|
|
hsa_ext_program_finalize(program_, isa, 0, control_directives, "",
|
|
HSA_CODE_OBJECT_TYPE_PROGRAM, &code_object_)) {
|
|
return false;
|
|
}
|
|
|
|
if (HSA_STATUS_SUCCESS != hsa_executable_create(profile_,
|
|
HSA_EXECUTABLE_STATE_UNFROZEN,
|
|
"", &executable_)) {
|
|
return false;
|
|
}
|
|
|
|
if (HSA_STATUS_SUCCESS !=
|
|
hsa_executable_load_code_object(executable_, agent_, code_object_, "")) {
|
|
return false;
|
|
}
|
|
|
|
if (HSA_STATUS_SUCCESS != hsa_executable_freeze(executable_, "")) {
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
void HsaTest::GetGpuPeer(hsa_agent_t master,
|
|
std::vector<hsa_agent_t>& gpu_peers) {
|
|
AgentProps master_prop(master);
|
|
for (hsa_agent_t agent : gpus_) {
|
|
AgentProps agent_prop(agent);
|
|
if (master.handle == agent.handle ||
|
|
agent_prop.device_type != HSA_DEVICE_TYPE_GPU) {
|
|
continue;
|
|
}
|
|
|
|
hsa_amd_memory_pool_t peer_local_pool = global_coarse_[agent.handle];
|
|
|
|
hsa_amd_memory_pool_access_t access =
|
|
HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED;
|
|
if (HSA_STATUS_SUCCESS == hsa_amd_agent_memory_pool_get_info(
|
|
master, peer_local_pool,
|
|
HSA_AMD_AGENT_MEMORY_POOL_INFO_ACCESS,
|
|
(void*)&access) &&
|
|
access != HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED) {
|
|
gpu_peers.push_back(agent);
|
|
}
|
|
}
|
|
}
|
|
|
|
void* HsaTest::AllocateSystemMemory(bool fine_grain, size_t size) {
|
|
if (cpus_.size() == 0) {
|
|
return NULL;
|
|
}
|
|
|
|
hsa_amd_memory_pool_t pool = (fine_grain) ? global_fine_[cpus_[0].handle]
|
|
: global_coarse_[cpus_[0].handle];
|
|
|
|
void* ptr = NULL;
|
|
if (HSA_STATUS_SUCCESS != hsa_amd_memory_pool_allocate(pool, size, 0, &ptr)) {
|
|
return NULL;
|
|
}
|
|
|
|
return ptr;
|
|
}
|
|
|
|
void* HsaTest::AllocateLocalMemory(hsa_agent_t agent, size_t size) {
|
|
if (gpus_.size() == 0) {
|
|
return NULL;
|
|
}
|
|
|
|
hsa_amd_memory_pool_t pool = global_coarse_[agent.handle];
|
|
|
|
void* ptr = NULL;
|
|
if (HSA_STATUS_SUCCESS != hsa_amd_memory_pool_allocate(pool, size, 0, &ptr)) {
|
|
return NULL;
|
|
}
|
|
|
|
return ptr;
|
|
}
|
|
|
|
void HsaTest::FreeMemory(void* ptr) { hsa_amd_memory_pool_free(ptr); }
|
|
|
|
void HsaTest::LaunchPacket(hsa_queue_t& queue, hsa_packet_type_t type,
|
|
void* packet) {
|
|
uint32_t queue_bitmask = queue.size - 1;
|
|
const uint64_t write_index = hsa_queue_add_write_index_acq_rel(&queue, 1);
|
|
|
|
static const uint16_t kInvalidPacketHeader = HSA_PACKET_TYPE_INVALID;
|
|
|
|
if (type == HSA_PACKET_TYPE_KERNEL_DISPATCH) {
|
|
hsa_kernel_dispatch_packet_t* dispatch_packet =
|
|
reinterpret_cast<hsa_kernel_dispatch_packet_t*>(packet);
|
|
const uint16_t temp_header = dispatch_packet->header;
|
|
dispatch_packet->header = kInvalidPacketHeader;
|
|
|
|
// Populate queue buffer.
|
|
hsa_kernel_dispatch_packet_t* queue_buffer =
|
|
reinterpret_cast<hsa_kernel_dispatch_packet_t*>(queue.base_address);
|
|
queue_buffer[write_index & queue_bitmask] = *dispatch_packet;
|
|
|
|
// Enable packet.
|
|
std::atomic_thread_fence(std::memory_order_release);
|
|
queue_buffer[write_index & queue_bitmask].header = temp_header;
|
|
dispatch_packet->header = temp_header;
|
|
} else if (type == HSA_PACKET_TYPE_BARRIER_AND) {
|
|
hsa_barrier_and_packet_t* barrier_and_packet =
|
|
reinterpret_cast<hsa_barrier_and_packet_t*>(packet);
|
|
const uint16_t temp_header = barrier_and_packet->header;
|
|
barrier_and_packet->header = kInvalidPacketHeader;
|
|
|
|
// Populate queue buffer.
|
|
hsa_barrier_and_packet_t* queue_buffer =
|
|
reinterpret_cast<hsa_barrier_and_packet_t*>(queue.base_address);
|
|
queue_buffer[write_index & queue_bitmask] = *barrier_and_packet;
|
|
|
|
// Enable packet.
|
|
std::atomic_thread_fence(std::memory_order_release);
|
|
queue_buffer[write_index & queue_bitmask].header = temp_header;
|
|
barrier_and_packet->header = temp_header;
|
|
} else if (type == HSA_PACKET_TYPE_BARRIER_OR) {
|
|
hsa_barrier_or_packet_t* barrier_or_packet =
|
|
reinterpret_cast<hsa_barrier_or_packet_t*>(packet);
|
|
const uint16_t temp_header = barrier_or_packet->header;
|
|
barrier_or_packet->header = kInvalidPacketHeader;
|
|
|
|
// Populate queue buffer.
|
|
hsa_barrier_or_packet_t* queue_buffer =
|
|
reinterpret_cast<hsa_barrier_or_packet_t*>(queue.base_address);
|
|
queue_buffer[write_index & queue_bitmask] = *barrier_or_packet;
|
|
|
|
// Enable packet.
|
|
std::atomic_thread_fence(std::memory_order_release);
|
|
queue_buffer[write_index & queue_bitmask].header = temp_header;
|
|
barrier_or_packet->header = temp_header;
|
|
}
|
|
|
|
hsa_signal_store_release(queue.doorbell_signal, write_index);
|
|
}
|
|
|
|
void HsaTest::PrintAgentInfo(AgentProps& prop) {
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_NAME, prop.name, "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_VENDOR_NAME, prop.vendor_name, "");
|
|
|
|
const char* feature_strings[] = {"NONE", "HSA_AGENT_FEATURE_DISPATCH",
|
|
"HSA_AGENT_FEATURE_AGENT_DISPATCH"};
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_FEATURE, feature_strings[prop.feature], "");
|
|
|
|
const char* model_strings[] = {"HSA_MACHINE_MODEL_SMALL",
|
|
"HSA_MACHINE_MODEL_LARGE"};
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_MACHINE_MODEL,
|
|
model_strings[prop.machine_model], "");
|
|
|
|
const char* profile_strings[] = {"HSA_PROFILE_BASE", "HSA_PROFILE_FULL"};
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_PROFILE, profile_strings[prop.profile], "");
|
|
|
|
const char* default_float_rounding_strings[] = {
|
|
"HSA_DEFAULT_FLOAT_ROUNDING_MODE_DEFAULT",
|
|
"HSA_DEFAULT_FLOAT_ROUNDING_MODE_ZERO",
|
|
"HSA_DEFAULT_FLOAT_ROUNDING_MODE_NEAR"};
|
|
PRINT_ATTRIBUTE(
|
|
HSA_AGENT_INFO_DEFAULT_FLOAT_ROUNDING_MODE,
|
|
default_float_rounding_strings[prop.default_float_rounding_mode], "");
|
|
PRINT_ATTRIBUTE(
|
|
HSA_AGENT_INFO_BASE_PROFILE_DEFAULT_FLOAT_ROUNDING_MODES,
|
|
default_float_rounding_strings[prop.base_profile_float_rounding_mode],
|
|
"");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_FAST_F16_OPERATION, prop.fast_f16_operation,
|
|
"");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_WAVEFRONT_SIZE, prop.wavefront_size, "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_WORKGROUP_MAX_DIM[0],
|
|
prop.workgroup_max_dim[0], "");
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_WORKGROUP_MAX_DIM[1],
|
|
prop.workgroup_max_dim[1], "");
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_WORKGROUP_MAX_DIM[2],
|
|
prop.workgroup_max_dim[2], "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_WORKGROUP_MAX_SIZE, prop.workgroup_max_size,
|
|
"");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_GRID_MAX_DIM.x, prop.grid_max_dim.x, "");
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_GRID_MAX_DIM.y, prop.grid_max_dim.y, "");
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_GRID_MAX_DIM.z, prop.grid_max_dim.z, "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_GRID_MAX_SIZE, prop.grid_max_size, "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_FBARRIER_MAX_SIZE, prop.fbarrier_max_size, "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_QUEUES_MAX, prop.queue_max, "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_QUEUE_MIN_SIZE, prop.queue_min_size, "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_QUEUE_MAX_SIZE, prop.queue_max_size, "");
|
|
|
|
const char* queue_type_strings[] = {"HSA_QUEUE_TYPE_MULTI",
|
|
"HSA_QUEUE_TYPE_SINGLE"};
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_QUEUE_TYPE,
|
|
queue_type_strings[prop.queue_type], "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_NODE, prop.node, "");
|
|
|
|
const char* device_type_strings[] = {
|
|
"HSA_DEVICE_TYPE_CPU", "HSA_DEVICE_TYPE_GPU", "HSA_DEVICE_TYPE_DSP"};
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_DEVICE, device_type_strings[prop.device_type],
|
|
"");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_CACHE_SIZE[0], prop.cache_size[0], "bytes");
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_CACHE_SIZE[1], prop.cache_size[1], "bytes");
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_CACHE_SIZE[2], prop.cache_size[2], "bytes");
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_CACHE_SIZE[3], prop.cache_size[3], "bytes");
|
|
|
|
std::string extensions = "";
|
|
extensions += (prop.extensions[HSA_EXTENSION_FINALIZER])
|
|
? "HSA_EXTENSION_FINALIZER | "
|
|
: "";
|
|
extensions +=
|
|
(prop.extensions[HSA_EXTENSION_IMAGES]) ? "HSA_EXTENSION_IMAGES | " : "";
|
|
extensions += (prop.extensions[HSA_EXTENSION_AMD_PROFILER])
|
|
? "HSA_EXTENSION_AMD_PROFILER "
|
|
: "";
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_EXTENSIONS, extensions, "");
|
|
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_VERSION_MAJOR, prop.version_major, "");
|
|
PRINT_ATTRIBUTE(HSA_AGENT_INFO_VERSION_MINOR, prop.version_minor, "");
|
|
}
|
|
|
|
void HsaTest::PrintPeers(hsa_agent_t agent) {
|
|
std::cout << "Peer GPUs: ";
|
|
std::vector<hsa_agent_t> gpu_peers;
|
|
GetGpuPeer(agent, gpu_peers);
|
|
if (gpu_peers.size() > 0) {
|
|
for (hsa_agent_t peer_agent : gpu_peers) {
|
|
// Get the index of the peer in gpus_.
|
|
size_t peer_idx = 0;
|
|
for (; peer_idx < gpus_.size(); ++peer_idx) {
|
|
if (peer_agent.handle == gpus_[peer_idx].handle) {
|
|
std::cout << "GPU[" << peer_idx << "] ";
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
std::cout << std::endl;
|
|
} else {
|
|
std::cout << "No peer GPUs\n";
|
|
}
|
|
}
|
|
|
|
void HsaTest::PrintPoolInfo(PoolProps& prop) {
|
|
const char* segment_strings[] = {
|
|
"HSA_SEGMENT_GLOBAL", "HSA_AMD_SEGMENT_READONLY",
|
|
"HSA_AMD_SEGMENT_PRIVATE", "HSA_AMD_SEGMENT_GROUP"};
|
|
PRINT_ATTRIBUTE(HSA_AMD_MEMORY_POOL_INFO_SEGMENT,
|
|
segment_strings[prop.segment], "");
|
|
|
|
std::string global_flag = "";
|
|
global_flag +=
|
|
(prop.global_flag & HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_KERNARG_INIT)
|
|
? "HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_KERNARG_INIT | "
|
|
: "";
|
|
global_flag +=
|
|
(prop.global_flag & HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_FINE_GRAINED)
|
|
? "HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_FINE_GRAINED | "
|
|
: "";
|
|
global_flag +=
|
|
(prop.global_flag & HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_COARSE_GRAINED)
|
|
? "HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_COARSE_GRAINED "
|
|
: "";
|
|
PRINT_ATTRIBUTE(HSA_AMD_MEMORY_POOL_INFO_GLOBAL_FLAGS, global_flag, "");
|
|
|
|
static const size_t kMb = 1024 * 1024;
|
|
if (prop.size >= kMb) {
|
|
PRINT_ATTRIBUTE(HSA_AMD_MEMORY_POOL_INFO_SIZE, ToMB(prop.size), "MB");
|
|
} else {
|
|
PRINT_ATTRIBUTE(HSA_AMD_MEMORY_POOL_INFO_SIZE, prop.size, "bytes");
|
|
}
|
|
|
|
PRINT_ATTRIBUTE(HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED,
|
|
prop.alloc_allowed, "");
|
|
PRINT_ATTRIBUTE(HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_GRANULE,
|
|
prop.alloc_granule, "bytes");
|
|
PRINT_ATTRIBUTE(HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALIGNMENT,
|
|
prop.alloc_alignment, "bytes");
|
|
PRINT_ATTRIBUTE(HSA_AMD_MEMORY_POOL_INFO_ACCESSIBLE_BY_ALL,
|
|
prop.all_accessible, "");
|
|
}
|