8618ed31ca
SWDEV-111478 - [Vega] Clinfo doesn't report the CPU as a CL device. amdocl12cl64.dll is not loaded in Windows 10 (RS1) because the driverstore path wasn't searched to load for this module. Added the path to fix this issue. ReviewBoardURL = http://ocltc.amd.com/reviews/r/12211/ Affected files ... ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudevice.cpp#563 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os.cpp#6 edit
172 строки
4.1 KiB
C++
172 строки
4.1 KiB
C++
//
|
|
// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
|
|
#include "os/os.hpp"
|
|
#include "thread/thread.hpp"
|
|
|
|
#include <string>
|
|
#include <cstring>
|
|
|
|
#if defined(_WIN32) || defined(__CYGWIN__)
|
|
# include <windows.h>
|
|
#else // !_WIN32
|
|
# include <time.h>
|
|
# include <unistd.h>
|
|
#endif // !_WIN32
|
|
|
|
#if defined(ATI_ARCH_X86)
|
|
#include <xmmintrin.h> // for _mm_pause
|
|
#endif // ATI_ARCH_X86
|
|
|
|
namespace amd {
|
|
|
|
void*
|
|
Os::loadLibrary(const char* libraryname)
|
|
{
|
|
void* handle = Os::loadLibrary_(libraryname);
|
|
if (handle != NULL) {
|
|
return handle;
|
|
}
|
|
|
|
// Try with the system library prefix and extension instead.
|
|
std::string str = libraryname;
|
|
|
|
size_t namestart = str.rfind(fileSeparator());
|
|
namestart = (namestart != std::string::npos) ? namestart + 1 : 0;
|
|
|
|
const char* prefix = Os::libraryPrefix();
|
|
if (prefix != NULL
|
|
&& str.compare(namestart, strlen(prefix), prefix) == 0) {
|
|
// It is alread present, not need to prepend it.
|
|
prefix = NULL;
|
|
}
|
|
size_t dot = str.rfind('.');
|
|
if (dot != std::string::npos) {
|
|
// check that the dot was on the filename not a dir name.
|
|
if (namestart < dot) {
|
|
// strip the previous extension.
|
|
str.resize(dot);
|
|
}
|
|
}
|
|
if (prefix != NULL && prefix[0] != '\0') {
|
|
str.insert(namestart, prefix);
|
|
}
|
|
str.append(Os::libraryExtension());
|
|
|
|
handle = Os::loadLibrary_(str.c_str());
|
|
if (handle != NULL || str.find(fileSeparator()) != std::string::npos) {
|
|
return handle;
|
|
}
|
|
|
|
#if defined(ATI_OS_WIN)
|
|
// Try with the DriverStore path
|
|
HMODULE hm = NULL;
|
|
if (!GetModuleHandleExA(GET_MODULE_HANDLE_EX_FLAG_FROM_ADDRESS
|
|
| GET_MODULE_HANDLE_EX_FLAG_UNCHANGED_REFCOUNT,
|
|
(LPCSTR)&loadLibrary, &hm)) return NULL;
|
|
|
|
char cszDllPath[1024] = { 0 };
|
|
if (!GetModuleFileNameA(hm, cszDllPath, sizeof(cszDllPath)))
|
|
return NULL;
|
|
|
|
LPSTR cszFileName;
|
|
char buffer[1024] = { 0 };
|
|
if (!GetFullPathNameA(cszDllPath, sizeof(buffer), buffer, &cszFileName))
|
|
return NULL;
|
|
|
|
std::string newPath;
|
|
newPath = cszDllPath;
|
|
newPath.replace(newPath.find(cszFileName), strlen(libraryname), libraryname);
|
|
|
|
handle = Os::loadLibrary_(newPath.c_str());
|
|
if (handle != NULL) {
|
|
return handle;
|
|
}
|
|
#endif
|
|
|
|
// Try to find the lib in the current directory.
|
|
return Os::loadLibrary((std::string(".") + fileSeparator()
|
|
+ std::string(libraryname)).c_str());
|
|
}
|
|
|
|
size_t Os::pageSize_ = 0;
|
|
|
|
int Os::processorCount_ = 0;
|
|
|
|
void
|
|
Os::spinPause()
|
|
{
|
|
#if defined(ATI_ARCH_X86)
|
|
_mm_pause();
|
|
#elif defined(__ARM_ARCH_7A__)
|
|
__asm__ __volatile__("yield");
|
|
#endif
|
|
}
|
|
|
|
void
|
|
Os::sleep(long n)
|
|
{
|
|
// FIXME_lmoriche: Should be nano-seconds not seconds.
|
|
#ifdef _WIN32
|
|
::Sleep(n);
|
|
#else // !_WIN32
|
|
time_t seconds = (time_t) n / 1000;
|
|
long nanoseconds = ((long) n - seconds * 1000) * 1000000;
|
|
timespec ts = { seconds, nanoseconds };
|
|
::nanosleep(&ts, NULL);
|
|
#endif // !_WIN32
|
|
}
|
|
|
|
void
|
|
Os::touchStackPages(address bottom, address top)
|
|
{
|
|
top = alignDown(top, pageSize_) - pageSize_;
|
|
while (top >= bottom) {
|
|
*top = 0;
|
|
top -= pageSize_;
|
|
}
|
|
}
|
|
|
|
bool
|
|
Os::skipIDIV(address& pc)
|
|
{
|
|
address insn = pc;
|
|
if (insn[0] == 0x66) { // LCP prefix
|
|
insn += 1;
|
|
}
|
|
if ((insn[0] & 0xf0) == 0x40) { // REX prefix
|
|
insn += 1;
|
|
}
|
|
if (insn[0] == 0xf6 || insn[0] == 0xf7) { // IDIV
|
|
// This is a DivisionError: skip the insn and resume execution
|
|
char mod = insn[1] >> 6;
|
|
char rm = insn[1] & 0x7;
|
|
insn += 2; // skip opcode and mod/rm
|
|
|
|
if (rm == 0x4 && mod != 0x3) {
|
|
insn += 1; // sib follows mod/rm
|
|
}
|
|
|
|
if ((mod == 0x0 && rm == 0x5) || mod == 0x2) {
|
|
insn += 4; // disp32
|
|
}
|
|
else if (mod == 0x1) {
|
|
insn += 1; // disp8
|
|
}
|
|
pc = insn;
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
void
|
|
Os::setThreadAffinity(const void* handle, unsigned int cpu)
|
|
{
|
|
ThreadAffinityMask mask;
|
|
mask.set(cpu);
|
|
setThreadAffinity(handle, mask);
|
|
}
|
|
|
|
} // namespace amd
|