From 1113d554f00cf66e073014974cae4cdc2ca5f853 Mon Sep 17 00:00:00 2001
From: foreman
Date: Tue, 13 Mar 2018 12:33:01 -0400
Subject: [PATCH] P4 to Git Change 1526407 by cpaquot@cpaquot-ocl-lc-lnx on
2018/03/13 12:24:51
SWDEV-145570 - [HIP] Separate device runtime and driver APIs
Affected files ...
... //depot/stg/opencl/drivers/opencl/api/hip/hip_device.cpp#5 edit
... //depot/stg/opencl/drivers/opencl/api/hip/hip_device_runtime.cpp#1 add
[ROCm/hip commit: 22aeb7f4f3fc9f7f0b79451a3301619d0129fe3b]
---
projects/hip/api/hip/hip_device.cpp | 455 -----------------
projects/hip/api/hip/hip_device_runtime.cpp | 533 ++++++++++++++++++++
2 files changed, 533 insertions(+), 455 deletions(-)
create mode 100644 projects/hip/api/hip/hip_device_runtime.cpp
diff --git a/projects/hip/api/hip/hip_device.cpp b/projects/hip/api/hip/hip_device.cpp
index c719f30122..ae9cba963d 100644
--- a/projects/hip/api/hip/hip_device.cpp
+++ b/projects/hip/api/hip/hip_device.cpp
@@ -24,20 +24,6 @@ THE SOFTWARE.
#include "hip_internal.hpp"
-hipError_t hipGetDevice(int *deviceId) {
-
- HIP_INIT_API(deviceId);
-
- if (deviceId != nullptr) {
- // this needs to return default device. For now return 0 always
- *deviceId = 0;
- } else {
- return hipErrorInvalidValue;
- }
-
- return hipSuccess;
-}
-
hipError_t hipDeviceGet(hipDevice_t *device, int deviceId)
{
HIP_INIT_API(device, deviceId);
@@ -51,239 +37,6 @@ hipError_t hipDeviceGet(hipDevice_t *device, int deviceId)
return hipSuccess;
};
-hipError_t hipGetDeviceCount(int* count) {
-
- HIP_INIT_API(count);
-
- if (count == nullptr) {
- return hipErrorInvalidValue;
- }
-
- // Get all available devices
- *count = g_context->devices().size();
-
- return hipSuccess;
-}
-
-hipError_t hipDeviceGetAttribute(int* pi, hipDeviceAttribute_t attr, int device) {
-
- HIP_INIT_API(pi, attr, device);
-
- if (pi == nullptr) {
- return hipErrorInvalidValue;
- }
-
- //if (unsigned(device) >= g_context->devices().size()) {
- // return hipErrorInvalidDevice;
- //}
- //auto* deviceHandle = g_context->devices()[device];
-
- //FIXME: should we cache the props, or just select from deviceHandle->info_?
- hipDeviceProp_t prop = {0};
- hipError_t err = hipGetDeviceProperties(&prop, device);
- if (err != hipSuccess) return err;
-
- switch (attr) {
- case hipDeviceAttributeMaxThreadsPerBlock:
- *pi = prop.maxThreadsPerBlock;
- break;
- case hipDeviceAttributeMaxBlockDimX:
- *pi = prop.maxThreadsDim[0];
- break;
- case hipDeviceAttributeMaxBlockDimY:
- *pi = prop.maxThreadsDim[1];
- break;
- case hipDeviceAttributeMaxBlockDimZ:
- *pi = prop.maxThreadsDim[2];
- break;
- case hipDeviceAttributeMaxGridDimX:
- *pi = prop.maxGridSize[0];
- break;
- case hipDeviceAttributeMaxGridDimY:
- *pi = prop.maxGridSize[1];
- break;
- case hipDeviceAttributeMaxGridDimZ:
- *pi = prop.maxGridSize[2];
- break;
- case hipDeviceAttributeMaxSharedMemoryPerBlock:
- *pi = prop.sharedMemPerBlock;
- break;
- case hipDeviceAttributeTotalConstantMemory:
- *pi = prop.totalConstMem;
- break;
- case hipDeviceAttributeWarpSize:
- *pi = prop.warpSize;
- break;
- case hipDeviceAttributeMaxRegistersPerBlock:
- *pi = prop.regsPerBlock;
- break;
- case hipDeviceAttributeClockRate:
- *pi = prop.clockRate;
- break;
- case hipDeviceAttributeMemoryClockRate:
- *pi = prop.memoryClockRate;
- break;
- case hipDeviceAttributeMemoryBusWidth:
- *pi = prop.memoryBusWidth;
- break;
- case hipDeviceAttributeMultiprocessorCount:
- *pi = prop.multiProcessorCount;
- break;
- case hipDeviceAttributeComputeMode:
- *pi = prop.computeMode;
- break;
- case hipDeviceAttributeL2CacheSize:
- *pi = prop.l2CacheSize;
- break;
- case hipDeviceAttributeMaxThreadsPerMultiProcessor:
- *pi = prop.maxThreadsPerMultiProcessor;
- break;
- case hipDeviceAttributeComputeCapabilityMajor:
- *pi = prop.major;
- break;
- case hipDeviceAttributeComputeCapabilityMinor:
- *pi = prop.minor;
- break;
- case hipDeviceAttributePciBusId:
- *pi = prop.pciBusID;
- break;
- case hipDeviceAttributeConcurrentKernels:
- *pi = prop.concurrentKernels;
- break;
- case hipDeviceAttributePciDeviceId:
- *pi = prop.pciDeviceID;
- break;
- case hipDeviceAttributeMaxSharedMemoryPerMultiprocessor:
- *pi = prop.maxSharedMemoryPerMultiProcessor;
- break;
- case hipDeviceAttributeIsMultiGpuBoard:
- *pi = prop.isMultiGpuBoard;
- break;
- default:
- return hipErrorInvalidValue;
- }
-
- return hipSuccess;
-}
-
-hipError_t hipGetDeviceProperties(hipDeviceProp_t* props, int device) {
-
- HIP_INIT_API(props, device);
-
- if (props == nullptr) {
- return hipErrorInvalidValue;
- }
-
- if (unsigned(device) >= g_context->devices().size()) {
- return hipErrorInvalidDevice;
- }
- auto* deviceHandle = g_context->devices()[device];
-
- hipDeviceProp_t deviceProps = {0};
-
- const auto& info = deviceHandle->info();
- ::strncpy(deviceProps.name, info.boardName_, 128);
- deviceProps.totalGlobalMem = info.globalMemSize_;
- deviceProps.sharedMemPerBlock = info.localMemSizePerCU_;
- deviceProps.regsPerBlock = info.availableSGPRs_;
- deviceProps.warpSize = info.wavefrontWidth_;
- deviceProps.maxThreadsPerBlock = info.maxWorkGroupSize_;
- deviceProps.maxThreadsDim[0] = info.maxWorkItemSizes_[0];
- deviceProps.maxThreadsDim[1] = info.maxWorkItemSizes_[1];
- deviceProps.maxThreadsDim[2] = info.maxWorkItemSizes_[2];
- deviceProps.maxGridSize[0] = UINT32_MAX;
- deviceProps.maxGridSize[1] = UINT32_MAX;
- deviceProps.maxGridSize[2] = UINT32_MAX;
- deviceProps.clockRate = info.maxEngineClockFrequency_;
- deviceProps.memoryClockRate = info.maxMemoryClockFrequency_;
- deviceProps.memoryBusWidth = info.globalMemChannels_ * 32;
- deviceProps.totalConstMem = info.maxConstantBufferSize_;
- deviceProps.major = info.gfxipVersion_ / 100;
- deviceProps.minor = info.gfxipVersion_ % 100;
- deviceProps.multiProcessorCount = info.maxComputeUnits_;
- deviceProps.l2CacheSize = info.l2CacheSize_;
- deviceProps.maxThreadsPerMultiProcessor = info.simdPerCU_;
- deviceProps.computeMode = 0;
- deviceProps.clockInstructionRate = info.timeStampFrequency_;
- deviceProps.arch.hasGlobalInt32Atomics = 1;
- deviceProps.arch.hasGlobalFloatAtomicExch = 1;
- deviceProps.arch.hasSharedInt32Atomics = 1;
- deviceProps.arch.hasSharedFloatAtomicExch = 1;
- deviceProps.arch.hasFloatAtomicAdd = 0;
- deviceProps.arch.hasGlobalInt64Atomics = 1;
- deviceProps.arch.hasSharedInt64Atomics = 1;
- deviceProps.arch.hasDoubles = 1;
- deviceProps.arch.hasWarpVote = 0;
- deviceProps.arch.hasWarpBallot = 0;
- deviceProps.arch.hasWarpShuffle = 0;
- deviceProps.arch.hasFunnelShift = 0;
- deviceProps.arch.hasThreadFenceSystem = 1;
- deviceProps.arch.hasSyncThreadsExt = 0;
- deviceProps.arch.hasSurfaceFuncs = 0;
- deviceProps.arch.has3dGrid = 1;
- deviceProps.arch.hasDynamicParallelism = 0;
- deviceProps.concurrentKernels = 1;
- deviceProps.pciDomainID = info.deviceTopology_.pcie.function;
- deviceProps.pciBusID = info.deviceTopology_.pcie.bus;
- deviceProps.pciDeviceID = info.deviceTopology_.pcie.device;
- deviceProps.maxSharedMemoryPerMultiProcessor = info.localMemSizePerCU_;
- //deviceProps.isMultiGpuBoard = info.;
- deviceProps.canMapHostMemory = 1;
- deviceProps.gcnArch = info.gfxipVersion_;
-
- *props = deviceProps;
- return hipSuccess;
-}
-
-hipError_t hipDeviceSetCacheConfig(hipFuncCache_t cacheConfig) {
-
- HIP_INIT_API(cacheConfig);
-
- // No way to set cache config yet.
-
- return hipSuccess;
-}
-
-hipError_t hipDeviceGetCacheConfig(hipFuncCache_t *cacheConfig) {
- HIP_INIT_API(cacheConfig);
-
- if(cacheConfig == nullptr) {
- return hipErrorInvalidValue;
- }
-
- *cacheConfig = hipFuncCache_t();
-
- return hipSuccess;
-}
-
-hipError_t hipSetDeviceFlags(unsigned int flags) {
-
- HIP_INIT_API(flags);
-
- assert(0 && "Unimplemented");
-
- return hipSuccess;
-};
-
-hipError_t hipDeviceGetLimit (size_t *pValue, hipLimit_t limit) {
-
- HIP_INIT_API(pValue, limit);
-
- auto* deviceHandle = g_context->devices()[0];
- const auto& info = deviceHandle->info();
-
- if(pValue == nullptr) {
- return hipErrorInvalidValue;
- }
- if(limit == hipLimitMallocHeapSize) {
- *pValue = info.globalMemSize_;
- return hipSuccess;
- } else {
- return hipErrorUnsupportedLimit;
- }
-
-}
-
hipError_t hipFuncSetCacheConfig (const void* func, hipFuncCache_t cacheConfig) {
HIP_INIT_API(cacheConfig);
@@ -293,166 +46,6 @@ hipError_t hipFuncSetCacheConfig (const void* func, hipFuncCache_t cacheConfig)
return hipSuccess;
}
-hipError_t hipDeviceSetSharedMemConfig (hipSharedMemConfig config) {
-
- HIP_INIT_API(config);
-
- // No way to set cache config yet.
-
- return hipSuccess;
-}
-
-hipError_t hipDeviceGetSharedMemConfig (hipSharedMemConfig *pConfig) {
-
- HIP_INIT_API(pConfig);
-
- *pConfig = hipSharedMemBankSizeFourByte;
-
- return hipSuccess;
-}
-
-
-hipError_t hipChooseDevice(int* device, const hipDeviceProp_t* properties) {
-
- HIP_INIT_API(device, properties);
-
- if (device == nullptr || properties == nullptr) {
- return hipErrorInvalidValue;
- }
-
- *device = 0;
- cl_uint maxMatchedCount = 0;
-
- for (cl_uint i = 0; i< g_context->devices().size(); ++i) {
- hipDeviceProp_t currentProp = {0};
- cl_uint validPropCount = 0;
- cl_uint matchedCount = 0;
- hipError_t err = hipGetDeviceProperties(¤tProp, i);
- if (properties->major != 0) {
- validPropCount++;
- if(currentProp.major >= properties->major) {
- matchedCount++;
- }
- }
- if (properties->minor != 0) {
- validPropCount++;
- if(currentProp.minor >= properties->minor) {
- matchedCount++;
- }
- }
- if(properties->totalGlobalMem != 0) {
- validPropCount++;
- if(currentProp.totalGlobalMem >= properties->totalGlobalMem) {
- matchedCount++;
- }
- }
- if(properties->sharedMemPerBlock != 0) {
- validPropCount++;
- if(currentProp.sharedMemPerBlock >= properties->sharedMemPerBlock) {
- matchedCount++;
- }
- }
- if(properties->maxThreadsPerBlock != 0) {
- validPropCount++;
- if(currentProp.maxThreadsPerBlock >= properties->maxThreadsPerBlock ) {
- matchedCount++;
- }
- }
- if(properties->totalConstMem != 0) {
- validPropCount++;
- if(currentProp.totalConstMem >= properties->totalConstMem ) {
- matchedCount++;
- }
- }
- if(properties->multiProcessorCount != 0) {
- validPropCount++;
- if(currentProp.multiProcessorCount >=
- properties->multiProcessorCount ) {
- matchedCount++;
- }
- }
- if(properties->maxThreadsPerMultiProcessor != 0) {
- validPropCount++;
- if(currentProp.maxThreadsPerMultiProcessor >=
- properties->maxThreadsPerMultiProcessor ) {
- matchedCount++;
- }
- }
- if(properties->memoryClockRate != 0) {
- validPropCount++;
- if(currentProp.memoryClockRate >= properties->memoryClockRate ) {
- matchedCount++;
- }
- }
- if(properties->memoryBusWidth != 0) {
- validPropCount++;
- if(currentProp.memoryBusWidth >= properties->memoryBusWidth ) {
- matchedCount++;
- }
- }
- if(properties->l2CacheSize != 0) {
- validPropCount++;
- if(currentProp.l2CacheSize >= properties->l2CacheSize ) {
- matchedCount++;
- }
- }
- if(properties->regsPerBlock != 0) {
- validPropCount++;
- if(currentProp.regsPerBlock >= properties->regsPerBlock ) {
- matchedCount++;
- }
- }
- if(properties->maxSharedMemoryPerMultiProcessor != 0) {
- validPropCount++;
- if(currentProp.maxSharedMemoryPerMultiProcessor >=
- properties->maxSharedMemoryPerMultiProcessor ) {
- matchedCount++;
- }
- }
- if(properties->warpSize != 0) {
- validPropCount++;
- if(currentProp.warpSize >= properties->warpSize ) {
- matchedCount++;
- }
- }
- if(validPropCount == matchedCount) {
- *device = matchedCount > maxMatchedCount ? i : *device;
- maxMatchedCount = std::max(matchedCount, maxMatchedCount);
- }
- }
-
- return hipSuccess;
-}
-
-
-hipError_t hipDeviceGetByPCIBusId (int* device, const char* pciBusIdstr) {
-
- HIP_INIT_API(device, pciBusIdstr);
-
- if (device == nullptr || pciBusIdstr == nullptr) {
- return hipErrorInvalidValue;
- }
-
- int pciBusID = -1;
- int pciDeviceID = -1;
- int pciDomainID = -1;
-
- if (sscanf (pciBusIdstr, "%04x:%02x:%02x", &pciDomainID, &pciBusID, &pciDeviceID) == 0x3) {
- for (cl_uint i = 0; i < g_context->devices().size(); i++) {
- auto* deviceHandle = g_context->devices()[i];
- auto& info = deviceHandle->info();
-
- if (pciBusID == info.deviceTopology_.pcie.bus) {
- *device = i;
- break;
- }
- }
- }
-
- return hipSuccess;
-}
-
-
hipError_t hipDeviceTotalMem (size_t *bytes, hipDevice_t device) {
HIP_INIT_API(bytes, device);
@@ -513,51 +106,3 @@ hipError_t hipDeviceGetName(char *name, int len, hipDevice_t device) {
return hipSuccess;
}
-
-hipError_t hipDeviceGetPCIBusId (char *pciBusId, int len, int device) {
-
- HIP_INIT_API((void*)pciBusId, len, device);
-
- if (device < 0 || device > (cl_int)g_context->devices().size()) {
- return hipErrorInvalidDevice;
- }
-
- if (pciBusId == nullptr || len < 0) {
- return hipErrorInvalidValue;
- }
-
- auto* deviceHandle = g_context->devices()[device];
- const auto& info = deviceHandle->info();
- snprintf (pciBusId, len, "%04x:%02x:%02x.0",
- info.deviceTopology_.pcie.function,
- info.deviceTopology_.pcie.bus,
- info.deviceTopology_.pcie.device);
-
-
- return hipSuccess;
-}
-
-hipError_t hipSetDevice(int deviceId)
-{
- HIP_INIT_API(deviceId);
-
- assert(0 && "Unimplemented");
-
- return hipErrorUnknown;
-}
-
-hipError_t hipDeviceReset(void)
-{
- HIP_INIT_API();
-
- assert(0 && "Unimplemented");
-
- return hipErrorUnknown;
-}
-
-
-hipError_t hipDeviceSynchronize(void)
-{
- // FIXME: should wait on all streams
- return hipSuccess;
-}
diff --git a/projects/hip/api/hip/hip_device_runtime.cpp b/projects/hip/api/hip/hip_device_runtime.cpp
new file mode 100644
index 0000000000..b9b6ccb68e
--- /dev/null
+++ b/projects/hip/api/hip/hip_device_runtime.cpp
@@ -0,0 +1,533 @@
+/*
+Copyright (c) 2018 - present Advanced Micro Devices, Inc. All rights reserved.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in
+all copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+THE SOFTWARE.
+*/
+
+#include
+
+#include "hip_internal.hpp"
+
+hipError_t hipChooseDevice(int* device, const hipDeviceProp_t* properties) {
+
+ HIP_INIT_API(device, properties);
+
+ if (device == nullptr || properties == nullptr) {
+ return hipErrorInvalidValue;
+ }
+
+ *device = 0;
+ cl_uint maxMatchedCount = 0;
+
+ for (cl_uint i = 0; i< g_context->devices().size(); ++i) {
+ hipDeviceProp_t currentProp = {0};
+ cl_uint validPropCount = 0;
+ cl_uint matchedCount = 0;
+ hipError_t err = hipGetDeviceProperties(¤tProp, i);
+ if (properties->major != 0) {
+ validPropCount++;
+ if(currentProp.major >= properties->major) {
+ matchedCount++;
+ }
+ }
+ if (properties->minor != 0) {
+ validPropCount++;
+ if(currentProp.minor >= properties->minor) {
+ matchedCount++;
+ }
+ }
+ if(properties->totalGlobalMem != 0) {
+ validPropCount++;
+ if(currentProp.totalGlobalMem >= properties->totalGlobalMem) {
+ matchedCount++;
+ }
+ }
+ if(properties->sharedMemPerBlock != 0) {
+ validPropCount++;
+ if(currentProp.sharedMemPerBlock >= properties->sharedMemPerBlock) {
+ matchedCount++;
+ }
+ }
+ if(properties->maxThreadsPerBlock != 0) {
+ validPropCount++;
+ if(currentProp.maxThreadsPerBlock >= properties->maxThreadsPerBlock ) {
+ matchedCount++;
+ }
+ }
+ if(properties->totalConstMem != 0) {
+ validPropCount++;
+ if(currentProp.totalConstMem >= properties->totalConstMem ) {
+ matchedCount++;
+ }
+ }
+ if(properties->multiProcessorCount != 0) {
+ validPropCount++;
+ if(currentProp.multiProcessorCount >=
+ properties->multiProcessorCount ) {
+ matchedCount++;
+ }
+ }
+ if(properties->maxThreadsPerMultiProcessor != 0) {
+ validPropCount++;
+ if(currentProp.maxThreadsPerMultiProcessor >=
+ properties->maxThreadsPerMultiProcessor ) {
+ matchedCount++;
+ }
+ }
+ if(properties->memoryClockRate != 0) {
+ validPropCount++;
+ if(currentProp.memoryClockRate >= properties->memoryClockRate ) {
+ matchedCount++;
+ }
+ }
+ if(properties->memoryBusWidth != 0) {
+ validPropCount++;
+ if(currentProp.memoryBusWidth >= properties->memoryBusWidth ) {
+ matchedCount++;
+ }
+ }
+ if(properties->l2CacheSize != 0) {
+ validPropCount++;
+ if(currentProp.l2CacheSize >= properties->l2CacheSize ) {
+ matchedCount++;
+ }
+ }
+ if(properties->regsPerBlock != 0) {
+ validPropCount++;
+ if(currentProp.regsPerBlock >= properties->regsPerBlock ) {
+ matchedCount++;
+ }
+ }
+ if(properties->maxSharedMemoryPerMultiProcessor != 0) {
+ validPropCount++;
+ if(currentProp.maxSharedMemoryPerMultiProcessor >=
+ properties->maxSharedMemoryPerMultiProcessor ) {
+ matchedCount++;
+ }
+ }
+ if(properties->warpSize != 0) {
+ validPropCount++;
+ if(currentProp.warpSize >= properties->warpSize ) {
+ matchedCount++;
+ }
+ }
+ if(validPropCount == matchedCount) {
+ *device = matchedCount > maxMatchedCount ? i : *device;
+ maxMatchedCount = std::max(matchedCount, maxMatchedCount);
+ }
+ }
+
+ return hipSuccess;
+}
+
+hipError_t hipDeviceGetAttribute(int* pi, hipDeviceAttribute_t attr, int device) {
+
+ HIP_INIT_API(pi, attr, device);
+
+ if (pi == nullptr) {
+ return hipErrorInvalidValue;
+ }
+
+ //if (unsigned(device) >= g_context->devices().size()) {
+ // return hipErrorInvalidDevice;
+ //}
+ //auto* deviceHandle = g_context->devices()[device];
+
+ //FIXME: should we cache the props, or just select from deviceHandle->info_?
+ hipDeviceProp_t prop = {0};
+ hipError_t err = hipGetDeviceProperties(&prop, device);
+ if (err != hipSuccess) return err;
+
+ switch (attr) {
+ case hipDeviceAttributeMaxThreadsPerBlock:
+ *pi = prop.maxThreadsPerBlock;
+ break;
+ case hipDeviceAttributeMaxBlockDimX:
+ *pi = prop.maxThreadsDim[0];
+ break;
+ case hipDeviceAttributeMaxBlockDimY:
+ *pi = prop.maxThreadsDim[1];
+ break;
+ case hipDeviceAttributeMaxBlockDimZ:
+ *pi = prop.maxThreadsDim[2];
+ break;
+ case hipDeviceAttributeMaxGridDimX:
+ *pi = prop.maxGridSize[0];
+ break;
+ case hipDeviceAttributeMaxGridDimY:
+ *pi = prop.maxGridSize[1];
+ break;
+ case hipDeviceAttributeMaxGridDimZ:
+ *pi = prop.maxGridSize[2];
+ break;
+ case hipDeviceAttributeMaxSharedMemoryPerBlock:
+ *pi = prop.sharedMemPerBlock;
+ break;
+ case hipDeviceAttributeTotalConstantMemory:
+ *pi = prop.totalConstMem;
+ break;
+ case hipDeviceAttributeWarpSize:
+ *pi = prop.warpSize;
+ break;
+ case hipDeviceAttributeMaxRegistersPerBlock:
+ *pi = prop.regsPerBlock;
+ break;
+ case hipDeviceAttributeClockRate:
+ *pi = prop.clockRate;
+ break;
+ case hipDeviceAttributeMemoryClockRate:
+ *pi = prop.memoryClockRate;
+ break;
+ case hipDeviceAttributeMemoryBusWidth:
+ *pi = prop.memoryBusWidth;
+ break;
+ case hipDeviceAttributeMultiprocessorCount:
+ *pi = prop.multiProcessorCount;
+ break;
+ case hipDeviceAttributeComputeMode:
+ *pi = prop.computeMode;
+ break;
+ case hipDeviceAttributeL2CacheSize:
+ *pi = prop.l2CacheSize;
+ break;
+ case hipDeviceAttributeMaxThreadsPerMultiProcessor:
+ *pi = prop.maxThreadsPerMultiProcessor;
+ break;
+ case hipDeviceAttributeComputeCapabilityMajor:
+ *pi = prop.major;
+ break;
+ case hipDeviceAttributeComputeCapabilityMinor:
+ *pi = prop.minor;
+ break;
+ case hipDeviceAttributePciBusId:
+ *pi = prop.pciBusID;
+ break;
+ case hipDeviceAttributeConcurrentKernels:
+ *pi = prop.concurrentKernels;
+ break;
+ case hipDeviceAttributePciDeviceId:
+ *pi = prop.pciDeviceID;
+ break;
+ case hipDeviceAttributeMaxSharedMemoryPerMultiprocessor:
+ *pi = prop.maxSharedMemoryPerMultiProcessor;
+ break;
+ case hipDeviceAttributeIsMultiGpuBoard:
+ *pi = prop.isMultiGpuBoard;
+ break;
+ default:
+ return hipErrorInvalidValue;
+ }
+
+ return hipSuccess;
+}
+
+hipError_t hipDeviceGetByPCIBusId(int* device, const char*pciBusIdstr) {
+
+ HIP_INIT_API(device, pciBusIdstr);
+
+ if (device == nullptr || pciBusIdstr == nullptr) {
+ return hipErrorInvalidValue;
+ }
+
+ int pciBusID = -1;
+ int pciDeviceID = -1;
+ int pciDomainID = -1;
+
+ if (sscanf (pciBusIdstr, "%04x:%02x:%02x", &pciDomainID, &pciBusID, &pciDeviceID) == 0x3) {
+ for (cl_uint i = 0; i < g_context->devices().size(); i++) {
+ auto* deviceHandle = g_context->devices()[i];
+ auto& info = deviceHandle->info();
+
+ if (pciBusID == info.deviceTopology_.pcie.bus) {
+ *device = i;
+ break;
+ }
+ }
+ }
+
+ return hipSuccess;
+}
+
+hipError_t hipDeviceGetCacheConfig ( hipFuncCache_t * cacheConfig ) {
+ HIP_INIT_API(cacheConfig);
+
+ if(cacheConfig == nullptr) {
+ return hipErrorInvalidValue;
+ }
+
+ *cacheConfig = hipFuncCache_t();
+
+ return hipSuccess;
+}
+
+hipError_t hipDeviceGetLimit ( size_t* pValue, hipLimit_t limit ) {
+
+ HIP_INIT_API(pValue, limit);
+
+ auto* deviceHandle = g_context->devices()[0];
+ const auto& info = deviceHandle->info();
+
+ if(pValue == nullptr) {
+ return hipErrorInvalidValue;
+ }
+ if(limit == hipLimitMallocHeapSize) {
+ *pValue = info.globalMemSize_;
+ return hipSuccess;
+ } else {
+ return hipErrorUnsupportedLimit;
+ }
+}
+
+/**
+hipError_t hipDeviceGetP2PAttribute ( int* value, hipDeviceP2PAttr attr, int srcDevice, int dstDevice ) {
+ assert(0);
+ return hipSuccess;
+}
+**/
+
+hipError_t hipDeviceGetPCIBusId ( char* pciBusId, int len, int device ) {
+
+ HIP_INIT_API((void*)pciBusId, len, device);
+
+ if (device < 0 || device > (cl_int)g_context->devices().size()) {
+ return hipErrorInvalidDevice;
+ }
+
+ if (pciBusId == nullptr || len < 0) {
+ return hipErrorInvalidValue;
+ }
+
+ auto* deviceHandle = g_context->devices()[device];
+ const auto& info = deviceHandle->info();
+ snprintf (pciBusId, len, "%04x:%02x:%02x.0",
+ info.deviceTopology_.pcie.function,
+ info.deviceTopology_.pcie.bus,
+ info.deviceTopology_.pcie.device);
+
+
+ return hipSuccess;
+}
+
+hipError_t hipDeviceGetSharedMemConfig ( hipSharedMemConfig * pConfig ) {
+ HIP_INIT_API(pConfig);
+
+ *pConfig = hipSharedMemBankSizeFourByte;
+
+ return hipSuccess;
+}
+
+hipError_t hipDeviceGetStreamPriorityRange ( int* leastPriority, int* greatestPriority ) {
+ assert(0);
+ return hipSuccess;
+}
+
+hipError_t hipDeviceReset ( void ) {
+ HIP_INIT_API();
+
+ assert(0 && "Unimplemented");
+
+ return hipErrorUnknown;
+}
+
+hipError_t hipDeviceSetCacheConfig ( hipFuncCache_t cacheConfig ) {
+ HIP_INIT_API(cacheConfig);
+
+ // No way to set cache config yet.
+
+ return hipSuccess;
+}
+
+hipError_t hipDeviceSetLimit ( hipLimit_t limit, size_t value ) {
+ return hipErrorUnknown;
+}
+
+hipError_t hipDeviceSetSharedMemConfig ( hipSharedMemConfig config ) {
+ HIP_INIT_API(config);
+
+ // No way to set cache config yet.
+
+ return hipSuccess;
+}
+
+hipError_t hipDeviceSynchronize ( void ) {
+ return hipSuccess;
+}
+
+hipError_t hipGetDevice ( int* deviceId ) {
+ HIP_INIT_API(deviceId);
+
+ if (deviceId != nullptr) {
+ // this needs to return default device. For now return 0 always
+ *deviceId = 0;
+ } else {
+ return hipErrorInvalidValue;
+ }
+
+ return hipSuccess;
+}
+
+hipError_t hipGetDeviceCount ( int* count ) {
+ HIP_INIT_API(count);
+
+ if (count == nullptr) {
+ return hipErrorInvalidValue;
+ }
+
+ // Get all available devices
+ *count = g_context->devices().size();
+
+ return hipSuccess;
+}
+
+hipError_t hipGetDeviceFlags ( unsigned int* flags ) {
+ return hipErrorUnknown;
+}
+
+hipError_t hipGetDeviceProperties ( hipDeviceProp_t* props, int device ) {
+ HIP_INIT_API(props, device);
+
+ if (props == nullptr) {
+ return hipErrorInvalidValue;
+ }
+
+ if (unsigned(device) >= g_context->devices().size()) {
+ return hipErrorInvalidDevice;
+ }
+ auto* deviceHandle = g_context->devices()[device];
+
+ hipDeviceProp_t deviceProps = {0};
+
+ const auto& info = deviceHandle->info();
+ ::strncpy(deviceProps.name, info.boardName_, 128);
+ deviceProps.totalGlobalMem = info.globalMemSize_;
+ deviceProps.sharedMemPerBlock = info.localMemSizePerCU_;
+ deviceProps.regsPerBlock = info.availableSGPRs_;
+ deviceProps.warpSize = info.wavefrontWidth_;
+ deviceProps.maxThreadsPerBlock = info.maxWorkGroupSize_;
+ deviceProps.maxThreadsDim[0] = info.maxWorkItemSizes_[0];
+ deviceProps.maxThreadsDim[1] = info.maxWorkItemSizes_[1];
+ deviceProps.maxThreadsDim[2] = info.maxWorkItemSizes_[2];
+ deviceProps.maxGridSize[0] = UINT32_MAX;
+ deviceProps.maxGridSize[1] = UINT32_MAX;
+ deviceProps.maxGridSize[2] = UINT32_MAX;
+ deviceProps.clockRate = info.maxEngineClockFrequency_;
+ deviceProps.memoryClockRate = info.maxMemoryClockFrequency_;
+ deviceProps.memoryBusWidth = info.globalMemChannels_ * 32;
+ deviceProps.totalConstMem = info.maxConstantBufferSize_;
+ deviceProps.major = info.gfxipVersion_ / 100;
+ deviceProps.minor = info.gfxipVersion_ % 100;
+ deviceProps.multiProcessorCount = info.maxComputeUnits_;
+ deviceProps.l2CacheSize = info.l2CacheSize_;
+ deviceProps.maxThreadsPerMultiProcessor = info.simdPerCU_;
+ deviceProps.computeMode = 0;
+ deviceProps.clockInstructionRate = info.timeStampFrequency_;
+ deviceProps.arch.hasGlobalInt32Atomics = 1;
+ deviceProps.arch.hasGlobalFloatAtomicExch = 1;
+ deviceProps.arch.hasSharedInt32Atomics = 1;
+ deviceProps.arch.hasSharedFloatAtomicExch = 1;
+ deviceProps.arch.hasFloatAtomicAdd = 0;
+ deviceProps.arch.hasGlobalInt64Atomics = 1;
+ deviceProps.arch.hasSharedInt64Atomics = 1;
+ deviceProps.arch.hasDoubles = 1;
+ deviceProps.arch.hasWarpVote = 0;
+ deviceProps.arch.hasWarpBallot = 0;
+ deviceProps.arch.hasWarpShuffle = 0;
+ deviceProps.arch.hasFunnelShift = 0;
+ deviceProps.arch.hasThreadFenceSystem = 1;
+ deviceProps.arch.hasSyncThreadsExt = 0;
+ deviceProps.arch.hasSurfaceFuncs = 0;
+ deviceProps.arch.has3dGrid = 1;
+ deviceProps.arch.hasDynamicParallelism = 0;
+ deviceProps.concurrentKernels = 1;
+ deviceProps.pciDomainID = info.deviceTopology_.pcie.function;
+ deviceProps.pciBusID = info.deviceTopology_.pcie.bus;
+ deviceProps.pciDeviceID = info.deviceTopology_.pcie.device;
+ deviceProps.maxSharedMemoryPerMultiProcessor = info.localMemSizePerCU_;
+ //deviceProps.isMultiGpuBoard = info.;
+ deviceProps.canMapHostMemory = 1;
+ deviceProps.gcnArch = info.gfxipVersion_;
+
+ *props = deviceProps;
+ return hipSuccess;
+}
+
+hipError_t hipIpcCloseMemHandle ( void* devPtr ) {
+ HIP_INIT_API(devPtr);
+
+ assert(0 && "Unimplemented");
+
+ return hipErrorUnknown;
+}
+
+hipError_t hipIpcGetEventHandle ( hipIpcEventHandle_t* handle, hipEvent_t event ) {
+ HIP_INIT_API(handle, event);
+
+ assert(0 && "Unimplemented");
+
+ return hipErrorUnknown;
+}
+
+hipError_t hipIpcGetMemHandle ( hipIpcMemHandle_t* handle, void* devPtr ) {
+ HIP_INIT_API(handle, devPtr);
+
+ assert(0 && "Unimplemented");
+
+ return hipErrorUnknown;
+}
+
+hipError_t hipIpcOpenEventHandle ( hipEvent_t* event, hipIpcEventHandle_t handle ) {
+ HIP_INIT_API(event, handle);
+
+ assert(0 && "Unimplemented");
+
+ return hipErrorUnknown;
+}
+
+hipError_t hipIpcOpenMemHandle ( void** devPtr, hipIpcMemHandle_t handle, unsigned int flags ) {
+ HIP_INIT_API(devPtr, handle, flags);
+
+ assert(0 && "Unimplemented");
+
+ return hipErrorUnknown;
+}
+
+hipError_t hipSetDevice ( int device ) {
+ HIP_INIT_API(device);
+
+ assert(0 && "Unimplemented");
+
+ return hipErrorUnknown;
+}
+
+hipError_t hipSetDeviceFlags ( unsigned int flags ) {
+ HIP_INIT_API(flags);
+
+ assert(0 && "Unimplemented");
+
+ return hipSuccess;
+}
+
+hipError_t hipSetValidDevices ( int* device_arr, int len ) {
+ HIP_INIT_API(device_arr, len);
+
+ assert(0 && "Unimplemented");
+
+ return hipErrorUnknown;
+}
+