465c1c0287
SWDEV-102733 - [OCL-LC-ROCm] Cmake build Write CMakeLists.txt to enable building with and without the DK environment - Change the coding convention of the runtime files. Use Google's Style (https://google.github.io/styleguide/cppguide.html). Affected files ... ... //depot/stg/opencl/drivers/opencl/.clang-format#1 add ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_agent_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_command.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_context.cpp#53 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_counter.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_d3d10.cpp#15 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_d3d11.cpp#22 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_d3d9.cpp#32 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_debugger_amd.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_debugger_amd.h#7 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_device.cpp#61 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_event.cpp#10 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_execute.cpp#23 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_gl.cpp#53 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_icd.cpp#27 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_icd_amd.h#18 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_kernel.h#24 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_kernel_info_amd.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_kernel_info_amd.h#4 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_lqdflash_amd.cpp#17 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_lqdflash_amd.h#6 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_memobj.cpp#81 edit ... 
//depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_object.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_pipe.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_platform_amd.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_platform_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_profile_amd.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_profile_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_program.cpp#41 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_sampler.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_sdi_amd.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_sdi_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_semaphore_amd.h#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_svm.cpp#20 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_thread_trace_amd.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_thread_trace_amd.h#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/appprofile.cpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/appprofile.hpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/blit.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/blit.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/blitcl.cpp#11 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpubinary.cpp#11 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpubinary.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpubuiltins.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpubuiltins.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpucommand.cpp#66 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpucommand.hpp#40 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpudevice.cpp#280 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpudevice.hpp#96 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpufeat.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpukernel.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpumapping.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpumapping.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpuprogram.cpp#70 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpuprogram.hpp#14 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpusettings.cpp#33 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpusettings.hpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cputables.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpuvirtual.cpp#26 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpuvirtual.hpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/device.cpp#209 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/device.hpp#284 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuappprofile.cpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuappprofile.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpubinary.cpp#58 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpubinary.hpp#27 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpublit.cpp#126 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpublit.hpp#41 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpucompiler.cpp#156 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuconstbuf.cpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuconstbuf.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpucounters.cpp#12 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpucounters.hpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudebugger.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudebugmanager.cpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudebugmanager.hpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudefs.hpp#147 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudevice.cpp#567 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudevice.hpp#163 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpukernel.cpp#318 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpukernel.hpp#126 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpumemory.cpp#131 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpumemory.hpp#50 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuprintf.cpp#44 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuprintf.hpp#15 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuprogram.cpp#232 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuprogram.hpp#69 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuresource.cpp#238 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuresource.hpp#87 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpusched.hpp#19 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuschedcl.cpp#35 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuscsi.cpp#37 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpusettings.cpp#350 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpusettings.hpp#98 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputhreadtrace.cpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputhreadtrace.hpp#7 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputimestamp.cpp#27 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputimestamp.hpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputrap.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuvirtual.cpp#410 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuvirtual.hpp#140 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuwavelimiter.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuwavelimiter.hpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/hwdebug.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/hwdebug.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palappprofile.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palappprofile.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palbinary.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palbinary.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palblit.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palblit.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palcompiler.cpp#15 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palconstbuf.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palconstbuf.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palcounters.cpp#11 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palcounters.hpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldebugger.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldebugmanager.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldebugmanager.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldefs.hpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldevice.cpp#45 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/pal/paldevice.hpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d10.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d11.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d9.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldevicegl.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palkernel.cpp#34 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palkernel.hpp#11 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palmemory.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palmemory.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palprintf.cpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palprintf.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palprogram.cpp#39 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palprogram.hpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palresource.cpp#28 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palresource.hpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palsched.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palschedcl.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palsettings.cpp#24 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palsettings.hpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palthreadtrace.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palthreadtrace.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paltimestamp.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paltimestamp.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paltrap.hpp#2 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/pal/palvirtual.cpp#48 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palvirtual.hpp#21 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palwavelimiter.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palwavelimiter.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/mesa_glinterop.h#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocappprofile.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocappprofile.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocbinary.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocblit.cpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocblit.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/roccompiler.cpp#32 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/roccompilerlib.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/roccompilerlib.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdefs.hpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdevice.cpp#48 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdevice.hpp#20 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocglinterop.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocglinterop.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rockernel.cpp#22 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rockernel.hpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocmemory.cpp#15 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocmemory.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprintf.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprintf.hpp#5 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprogram.cpp#64 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprogram.hpp#23 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocregisters.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocsettings.cpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocsettings.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocvirtual.cpp#34 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocvirtual.hpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/alloc.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/alloc.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os.hpp#30 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os_posix.cpp#42 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os_win32.cpp#47 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/agent.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/agent.hpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/command.cpp#78 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/command.hpp#83 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/commandqueue.cpp#23 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/commandqueue.hpp#18 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/context.cpp#42 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/context.hpp#26 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/counter.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/interop.hpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/kernel.cpp#23 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/kernel.hpp#18 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/memory.cpp#127 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/platform/memory.hpp#100 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/ndrange.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/ndrange.hpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/object.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/object.hpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/perfctr.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/program.cpp#86 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/program.hpp#41 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/runtime.cpp#35 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/runtime.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/sampler.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/threadtrace.hpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/atomic.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/monitor.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/monitor.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/semaphore.cpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/semaphore.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/thread.cpp#14 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/thread.hpp#15 edit ... //depot/stg/opencl/drivers/opencl/runtime/top.hpp#26 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/concurrent.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/debug.cpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/debug.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/flags.cpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/flags.hpp#271 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/macros.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/util.hpp#12 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/utils/versions.hpp#2150 edit
537 строки
16 KiB
C++
537 строки
16 KiB
C++
//
|
|
// Copyright 2011 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
|
|
#include "device/cpu/cpuvirtual.hpp"
|
|
#include "device/cpu/cpudevice.hpp"
|
|
#include "device/cpu/cpucommand.hpp"
|
|
#include "device/blit.hpp"
|
|
#include "platform/command.hpp"
|
|
#include "platform/commandqueue.hpp"
|
|
#include "platform/memory.hpp"
|
|
#include "platform/sampler.hpp"
|
|
#include "os/os.hpp"
|
|
#include <algorithm>
|
|
|
|
namespace cpu {
|
|
|
|
//! Worker-thread counter shared by all VirtualCPU instances; starts at zero.
//! The constructor adds the device's compute-unit count and the destructor subtracts it.
amd::Atomic<size_t> VirtualCPU::numWorkerThreads_(0);
|
|
|
|
//! Builds a virtual CPU device.
//!
//! Reserves one worker-thread slot per compute unit in the shared counter, creates and
//! starts one WorkerThread per compute unit, then creates the host blit manager.
//! acceptingCommands_ is set to true only when every step succeeded; on any failure the
//! constructor returns early and leaves it false.
//!
//! \param device  CPU device this virtual device is created for.
VirtualCPU::VirtualCPU(Device& device) : device::VirtualDevice(device), acceptingCommands_(false) {
  const size_t numCores = device.info().maxComputeUnits_;

  // Reserve the threads in the shared counter; give the reservation back right away
  // when the total reaches the device limit.
  if ((numWorkerThreads_ += numCores) >= Device::getMaxWorkerThreadsNumber()) {
    numWorkerThreads_ -= numCores;
    cores_ = NULL;
    return;
  }

  cores_ = new (std::nothrow) WorkerThread*[numCores];
  if (cores_ == NULL) {
    // The destructor returns early when cores_ is NULL, so the reservation made above
    // must be returned here; otherwise the shared counter would never drop again.
    numWorkerThreads_ -= numCores;
    return;
  }

  // Clear memory for the worker threads
  memset(cores_, 0, numCores * sizeof(WorkerThread*));

#if defined(__linux__)
  // NOTE(review): isNuma is true when getNumaMask() returns NULL - confirm the polarity.
  const bool isNuma =
#if defined(NUMA_SUPPORT)
      device.getNumaMask() == NULL;
#else
      false;
#endif  // NUMA_SUPPORT
  const amd::Os::ThreadAffinityMask* affinityMask = isNuma ? NULL :
#else
  const amd::Os::ThreadAffinityMask* affinityMask =
#endif
                                                           device.getWorkerThreadsAffinity();

  // (uint)-1 marks "no affinity mask available".
  uint coreId = affinityMask != NULL ? affinityMask->getFirstSet() : (uint)-1;

  for (size_t i = 0; i < numCores; ++i) {
    WorkerThread* thread = cores_[i] = new WorkerThread(device);
    if (thread == NULL) {
      // Resume the threads created so far before giving up.
      for (size_t j = 0; j < i; ++j) {
        cores_[j]->resume();
      }
      return;
    }

    if (thread->state() != amd::Thread::INITIALIZED) {
      return;
    }

#if defined(__linux__)
    if (!isNuma) {
      if (coreId == (uint)-1) {
        // No mask: pin the thread to the core with the same index.
        thread->setAffinity((uint)i);
      } else {
        // Walk the set bits of the mask, one core per thread.
        thread->setAffinity(coreId);
        coreId = affinityMask->getNextSet(coreId);
      }
    }
#else  // On Windows we set an affinity mask and not a specific ID.
    if (coreId != (uint)-1) {
      thread->setAffinity(*affinityMask);
    }
#endif
    thread->start();
  }

  blitMgr_ = new device::HostBlitManager(*this);
  if ((NULL == blitMgr_) || !blitMgr_->create(device)) {
    LogError("Could not create BlitManager!");
    return;
  }

  acceptingCommands_ = true;
}
|
|
|
|
//! Destroys the blit manager and the worker threads and returns the reserved
//! worker-thread slots. Does nothing when the core array was never allocated.
VirtualCPU::~VirtualCPU() {
  if (cores_ != NULL) {
    delete blitMgr_;

    const size_t coreCount = device().info().maxComputeUnits_;
    size_t idx = 0;
    while (idx < coreCount) {
      delete cores_[idx];
      ++idx;
    }

    // Give the slots back to the shared counter before freeing the array.
    numWorkerThreads_ -= coreCount;
    delete[] cores_;
  }
}
|
|
|
|
bool VirtualCPU::terminate() {
|
|
if (cores_ == NULL) {
|
|
return true;
|
|
}
|
|
|
|
const size_t numCores = device().info().maxComputeUnits_;
|
|
for (size_t i = 0; i < numCores; ++i) {
|
|
if (cores_[i]) {
|
|
cores_[i]->terminate();
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
//! Executes a read command (buffer, buffer rect or image) through the blit manager.
//! The command ends as CL_COMPLETE on success and CL_INVALID_OPERATION otherwise,
//! including for an unsupported command type.
void VirtualCPU::submitReadMemory(amd::ReadMemoryCommand& vcmd) {
  vcmd.setStatus(CL_RUNNING);

  bool ok = false;
  device::Memory memory(vcmd.source());

  // Make sure the source holds current data before reading from it.
  vcmd.source().cacheWriteBack();

  // Dispatch on the concrete read command.
  switch (vcmd.type()) {
    case CL_COMMAND_READ_BUFFER: {
      ok = blitMgr().readBuffer(memory, vcmd.destination(), vcmd.origin(), vcmd.size(),
                                vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_READ_BUFFER_RECT: {
      ok = blitMgr().readBufferRect(memory, vcmd.destination(), vcmd.bufRect(), vcmd.hostRect(),
                                    vcmd.size(), vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_READ_IMAGE: {
      ok = blitMgr().readImage(memory, vcmd.destination(), vcmd.origin(), vcmd.size(),
                               vcmd.rowPitch(), vcmd.slicePitch(), vcmd.isEntireMemory());
      break;
    }
    default: {
      LogError("Unsupported type for the read command");
      break;
    }
  }

  if (ok) {
    vcmd.setStatus(CL_COMPLETE);
    return;
  }

  LogError("submitReadMemory failed!");
  vcmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
//! Executes a write command (buffer, buffer rect or image) through the blit manager.
//! The command ends as CL_COMPLETE on success and CL_INVALID_OPERATION otherwise,
//! including for an unsupported command type.
void VirtualCPU::submitWriteMemory(amd::WriteMemoryCommand& vcmd) {
  vcmd.setStatus(CL_RUNNING);

  bool ok = false;
  device::Memory memory(vcmd.destination());

  // Make sure the destination holds current data before it is modified.
  vcmd.destination().cacheWriteBack();

  // Dispatch on the concrete write command.
  switch (vcmd.type()) {
    case CL_COMMAND_WRITE_BUFFER: {
      ok = blitMgr().writeBuffer(vcmd.source(), memory, vcmd.origin(), vcmd.size(),
                                 vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_WRITE_BUFFER_RECT: {
      ok = blitMgr().writeBufferRect(vcmd.source(), memory, vcmd.hostRect(), vcmd.bufRect(),
                                     vcmd.size(), vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_WRITE_IMAGE: {
      ok = blitMgr().writeImage(vcmd.source(), memory, vcmd.origin(), vcmd.size(),
                                vcmd.rowPitch(), vcmd.slicePitch(), vcmd.isEntireMemory());
      break;
    }
    default: {
      LogError("Unsupported type for the write command");
      break;
    }
  }

  // The CPU works directly on the backing store, so mark the cache as clean.
  // This happens regardless of whether the write succeeded.
  vcmd.destination().signalWrite(NULL);

  if (ok) {
    vcmd.setStatus(CL_COMPLETE);
    return;
  }

  LogError("submitWriteMemory failed!");
  vcmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
|
|
//! Executes a copy command between two memory objects through the blit manager.
//! Handles buffer, buffer-rect, image and the two mixed buffer/image copies. The command
//! ends as CL_COMPLETE on success and CL_INVALID_OPERATION otherwise.
void VirtualCPU::submitCopyMemory(amd::CopyMemoryCommand& vcmd) {
  vcmd.setStatus(CL_RUNNING);

  // Bring both sides up-to-date first.
  vcmd.source().cacheWriteBack();
  vcmd.destination().cacheWriteBack();

  // Wrap the memory objects for the blit manager (destination first, then source).
  device::Memory dstMemory(vcmd.destination());
  device::Memory srcMemory(vcmd.source());

  bool ok = false;

  // Dispatch on the concrete copy command.
  switch (vcmd.type()) {
    case CL_COMMAND_COPY_BUFFER: {
      ok = blitMgr().copyBuffer(srcMemory, dstMemory, vcmd.srcOrigin(), vcmd.dstOrigin(),
                                vcmd.size(), vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_COPY_BUFFER_RECT: {
      ok = blitMgr().copyBufferRect(srcMemory, dstMemory, vcmd.srcRect(), vcmd.dstRect(),
                                    vcmd.size(), vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_COPY_IMAGE_TO_BUFFER: {
      ok = blitMgr().copyImageToBuffer(srcMemory, dstMemory, vcmd.srcOrigin(), vcmd.dstOrigin(),
                                       vcmd.size(), vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_COPY_BUFFER_TO_IMAGE: {
      ok = blitMgr().copyBufferToImage(srcMemory, dstMemory, vcmd.srcOrigin(), vcmd.dstOrigin(),
                                       vcmd.size(), vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_COPY_IMAGE: {
      ok = blitMgr().copyImage(srcMemory, dstMemory, vcmd.srcOrigin(), vcmd.dstOrigin(),
                               vcmd.size(), vcmd.isEntireMemory());
      break;
    }
    default: {
      LogError("Unsupported command type for memory copy!");
      break;
    }
  }

  // The CPU works directly on the backing store, so mark the cache as clean.
  vcmd.destination().signalWrite(NULL);

  if (ok) {
    vcmd.setStatus(CL_COMPLETE);
    return;
  }

  LogError("submitCopyMemory failed!");
  vcmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
//! Handles a map command: writes the memory object's cache back and completes the
//! command. The read/write map flags are only logged, not acted upon.
void VirtualCPU::submitMapMemory(amd::MapMemoryCommand& cmd) {
  cmd.setStatus(CL_RUNNING);

  const bool readOrWrite = (cmd.mapFlags() & (CL_MAP_READ | CL_MAP_WRITE)) != 0;
  if (readOrWrite) {
    LogInfo("cpu::VirtualCPU::submitMapMemory() CL_MAP_READ and CL_MAP_WRITE ignored");
  }

  // Bring the memory up-to-date before it is handed to the host.
  cmd.memory().cacheWriteBack();

  cmd.setStatus(CL_COMPLETE);
}
|
|
|
|
//! Handles an unmap command: signals a write on the memory object and completes
//! the command.
void VirtualCPU::submitUnmapMemory(amd::UnmapMemoryCommand& cmd) {
  cmd.setStatus(CL_RUNNING);

  // The CPU works directly on the backing store, so mark the cache as clean.
  cmd.memory().signalWrite(NULL);

  //! @todo:dgladdin: strictly speaking we should check that the mem object was mapped
  cmd.setStatus(CL_COMPLETE);
}
|
|
|
|
//! Executes a fill command (buffer or image) through the blit manager.
//! The command ends as CL_COMPLETE on success and CL_INVALID_OPERATION otherwise,
//! including for an unsupported command type.
void VirtualCPU::submitFillMemory(amd::FillMemoryCommand& vcmd) {
  vcmd.setStatus(CL_RUNNING);

  device::Memory memory(vcmd.memory());

  // Bring the target up-to-date before filling it.
  vcmd.memory().cacheWriteBack();

  bool ok = false;

  // Pick the right fill operation.
  switch (vcmd.type()) {
    case CL_COMMAND_FILL_BUFFER: {
      ok = blitMgr().fillBuffer(memory, vcmd.pattern(), vcmd.patternSize(), vcmd.origin(),
                                vcmd.size(), vcmd.isEntireMemory());
      break;
    }
    case CL_COMMAND_FILL_IMAGE: {
      ok = blitMgr().fillImage(memory, vcmd.pattern(), vcmd.origin(), vcmd.size(),
                               vcmd.isEntireMemory());
      break;
    }
    default: {
      LogError("Unsupported command type for FillMemory!");
      break;
    }
  }

  // Signalled regardless of whether the fill succeeded.
  vcmd.memory().signalWrite(NULL);

  if (ok) {
    vcmd.setStatus(CL_COMPLETE);
    return;
  }

  LogError("submitFillMemory failed!");
  vcmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
//! Helper function for forcing a cache sync for all kernel parameters
|
|
static void syncAllParams(amd::NDRangeKernelCommand& cmd) {
|
|
const amd::Kernel& kernel = cmd.kernel();
|
|
const amd::KernelParameters& kernelParam = kernel.parameters();
|
|
const amd::KernelSignature& signature = kernel.signature();
|
|
const amd::Device& device = cmd.queue()->device();
|
|
|
|
for (size_t i = 0; i < signature.numParameters(); ++i) {
|
|
const amd::KernelParameterDescriptor& desc = signature.at(i);
|
|
if (desc.type_ == T_POINTER && desc.size_ > 0 &&
|
|
!kernelParam.boundToSvmPointer(device, cmd.parameters(), i)) {
|
|
address ptr = (address)(cmd.parameters() + desc.offset_);
|
|
amd::Memory* memArg = *(amd::Memory**)ptr;
|
|
|
|
if (memArg != NULL) {
|
|
memArg->cacheWriteBack();
|
|
memArg->signalWrite(NULL);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
//! Chooses a local work size for a command that did not specify one and stores it in
//! both \a local and the command.
//!
//! The heuristic aims for up to four work-groups per compute unit, capped by the
//! device's maximum work-group size and per-dimension work-item limits. When a uniform
//! work-group size is required, each dimension is shrunk until it divides the global
//! size exactly.
//!
//! \param command  Kernel command whose global size is read and whose local size is set.
//! \param local    In: range with the desired number of dimensions. Out: chosen sizes.
void VirtualCPU::computeLocalSizes(amd::NDRangeKernelCommand& command, amd::NDRange& local) {
  bool uniformSize =
      (OPENCL_MAJOR < 2) || command.kernel().getDeviceKernel(device())->getUniformWorkGroupSize();

  const amd::NDRangeContainer& sizes = command.sizes();
  const size_t numCores = device().info().maxComputeUnits_;

  const size_t globalSize1D = sizes.global().product();
  if (globalSize1D == 0) {
    // Empty range: the heuristic below would divide by zero. A local size of 1 keeps the
    // caller's group computation well defined, and it yields zero groups.
    for (size_t i = 0; i < local.dimensions(); ++i) {
      local[i] = 1;
    }
    command.setLocalWorkSize(local);
    return;
  }

  const size_t targetNumOperations = std::min(globalSize1D, numCores * 4);
  size_t localSize1D =
      std::min(globalSize1D / targetNumOperations, device().info().maxWorkGroupSize_);

  for (size_t i = 0; i < local.dimensions(); ++i) {
    const size_t globalSize = sizes.global()[i];
    size_t localSize =
        std::min(std::min(localSize1D, globalSize), device().info().maxWorkItemSizes_[i]);

    // local must exactly divide global if uniform size is required
    // For non uniform size, we could use the work group size hint
    if (uniformSize) {
      //! @todo: lmoriche: find a better way
      while (globalSize % localSize != 0) {
        --localSize;
      }
    }
    local[i] = localSize;
    // Remaining budget for the following dimensions.
    localSize1D /= localSize;
  }

  command.setLocalWorkSize(local);
}
|
|
|
|
|
|
//! Returns, per dimension, 1 when \a local does not divide \a global exactly and
//! 0 otherwise. The result has as many dimensions as \a local.
static amd::NDRange computeRemainders(const amd::NDRange& global, const amd::NDRange& local) {
  amd::NDRange partialGroups(local.dimensions());

  for (size_t dim = 0; dim < local.dimensions(); ++dim) {
    const bool hasPartialGroup = (global[dim] % local[dim]) != 0;
    partialGroups[dim] = hasPartialGroup ? 1 : 0;
  }

  return partialGroups;
}
|
|
|
|
//! Runs an NDRange kernel command on the worker threads and waits for it to finish.
//! The work-groups are handed to min(number of groups, number of cores) workers as one
//! shared batch. A command with zero work-groups is completed immediately.
void VirtualCPU::submitKernel(amd::NDRangeKernelCommand& command) {
  const amd::NDRangeContainer& sizes = command.sizes();
  const size_t coreCount = device().info().maxComputeUnits_;

  // Use the caller's local size, or derive one when none was given.
  amd::NDRange local = sizes.local();
  if (local == 0) {
    computeLocalSizes(command, local);
  }

  // Partial groups add one extra group in their dimension.
  amd::NDRange partialGroups = computeRemainders(sizes.global(), local);

  // number of groups in each dimension
  const amd::NDRange numGroups = (sizes.global() / local) + partialGroups;

  size_t groupTotal = numGroups.product();
  if (groupTotal == 0) {
    command.setStatus(CL_COMPLETE);
    return;
  }

  syncAllParams(command);

  // retain the command here instead of retaining in NDRangeKernelBatch' ctor
  command.retain();

  size_t workerCount = std::min(groupTotal, coreCount);
  NDRangeKernelBatch batch(command, *this, numGroups, workerCount);

  Operation::Counter counter(command, workerCount);
  command.setData(&counter);

  // Hand the batch to each participating worker and kick it off.
  for (size_t worker = 0; worker < workerCount; ++worker) {
    batch.setCoreId(worker);
    cores_[worker]->enqueue(batch);
    cores_[worker]->flush();
  }

  // batch and counter live on this stack frame, so wait before returning.
  command.awaitCompletion();
  command.release();
}
|
|
|
|
//! Runs a native-function command on the first worker thread and waits for completion.
void VirtualCPU::submitNativeFn(amd::NativeFnCommand& command) {
  NativeFn nativeOp(command);

  WorkerThread* const firstCore = cores_[0];
  firstCore->enqueue(nativeOp);
  firstCore->flush();

  // nativeOp lives on this stack frame, so wait before returning.
  command.awaitCompletion();
}
|
|
|
|
//! A marker needs no work here; the command is completed immediately.
void VirtualCPU::submitMarker(amd::Marker& command) {
  command.setStatus(CL_COMPLETE);
}
|
|
|
|
//! Acquires the external (graphics API) objects listed in the command by calling
//! mapExtObjectInCQThread() on each non-NULL entry. The command ends as CL_COMPLETE
//! when every call succeeded and CL_INVALID_OPERATION otherwise.
void VirtualCPU::submitAcquireExtObjects(amd::AcquireExtObjectsCommand& cmd) {
  //! @todo [odintsov]: create an AcquireExtObjectsOperation and enqueue it
  //! to a core when a core scheduler is around.
  //
  // cores_[0]->enqueue(new AcquireExtObjectsOperation(cmd));
  // the code below will be moved to AcquireExtObjectsOperation::execute()
  cmd.setStatus(CL_RUNNING);

  bool anyFailed = false;

  // Every object is processed even after an earlier one failed.
  const std::vector<amd::Memory*>& memObjects = cmd.getMemList();
  for (std::vector<amd::Memory*>::const_iterator it = memObjects.begin();
       it != memObjects.end(); ++it) {
    amd::Memory* const memObj = *it;
    if (memObj && !memObj->mapExtObjectInCQThread()) {
      anyFailed = true;
    }
  }

  cmd.setStatus(anyFailed ? CL_INVALID_OPERATION : CL_COMPLETE);
}
|
|
|
|
//! Releases the external (graphics API) objects listed in the command by calling
//! unmapExtObjectInCQThread() on each non-NULL entry. The command ends as CL_COMPLETE
//! when every call succeeded and CL_INVALID_OPERATION otherwise.
void VirtualCPU::submitReleaseExtObjects(amd::ReleaseExtObjectsCommand& cmd) {
  //! @todo [odintsov]: create a ReleaseExtObjectsOperation and enqueue it
  //! to a core when a core scheduler is around.
  //
  // cores_[i]->enqueue(new ReleaseExtObjectsOperation(cmd));
  // the code below will be moved to ReleaseExtObjectsOperation::execute()
  cmd.setStatus(CL_RUNNING);

  bool anyFailed = false;

  // Every object is processed even after an earlier one failed.
  const std::vector<amd::Memory*>& memObjects = cmd.getMemList();
  for (std::vector<amd::Memory*>::const_iterator it = memObjects.begin();
       it != memObjects.end(); ++it) {
    amd::Memory* const memObj = *it;
    if (memObj && !memObj->unmapExtObjectInCQThread()) {
      anyFailed = true;
    }
  }

  cmd.setStatus(anyFailed ? CL_INVALID_OPERATION : CL_COMPLETE);
}
|
|
|
|
//! Hardware performance counters are not available on the CPU device: the command
//! is logged as an error and ends as CL_INVALID_OPERATION.
void VirtualCPU::submitPerfCounter(amd::PerfCounterCommand& cmd) {
  cmd.setStatus(CL_RUNNING);

  LogError("We don't support HW perf counters on CPU");

  cmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
//! Thread trace is not available on the CPU device: the command is logged as an
//! error and ends as CL_INVALID_OPERATION.
void VirtualCPU::submitThreadTraceMemObjects(amd::ThreadTraceMemObjectsCommand& cmd) {
  cmd.setStatus(CL_RUNNING);

  LogError("We don't support thread trace on CPU");

  cmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
//! Thread trace is not available on the CPU device: the command is logged as an
//! error and ends as CL_INVALID_OPERATION.
void VirtualCPU::submitThreadTrace(amd::ThreadTraceCommand& cmd) {
  cmd.setStatus(CL_RUNNING);

  LogError("We don't support thread trace on CPU");

  cmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
//! Releases every command in the linked list starting at \a list.
//! The \a wait argument is not used by this implementation.
void VirtualCPU::flush(amd::Command* list, bool wait) {
  for (amd::Command* current = list; current != NULL;) {
    // Fetch the successor first: release() may destroy the current command.
    amd::Command* const next = current->getNext();
    current->release();
    current = next;
  }
}
|
|
|
|
//! Signal commands are rejected here: the command ends as CL_INVALID_OPERATION.
void VirtualCPU::submitSignal(amd::SignalCommand& cmd) {
  cmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
//! Make-buffers-resident commands are rejected here: the command ends as
//! CL_INVALID_OPERATION.
void VirtualCPU::submitMakeBuffersResident(amd::MakeBuffersResidentCommand& cmd) {
  cmd.setStatus(CL_INVALID_OPERATION);
}
|
|
|
|
//! Frees the SVM pointers carried by the command. When a free callback was supplied it
//! is invoked once with the whole pointer list; otherwise each pointer is released
//! through amd::SvmBuffer::free().
void VirtualCPU::submitSvmFreeMemory(amd::SvmFreeMemoryCommand& cmd) {
  cmd.setStatus(CL_RUNNING);

  if (cmd.pfnFreeFunc() != NULL) {
    // User-supplied callback takes over the release of all pointers.
    cmd.pfnFreeFunc()(as_cl(cmd.queue()->asCommandQueue()), cmd.svmPointers().size(),
                      (void**)(&(cmd.svmPointers()[0])), cmd.userData());
  } else {
    // pointers allocated using clSVMAlloc
    for (cl_uint idx = 0; idx < cmd.svmPointers().size(); idx++) {
      amd::SvmBuffer::free(cmd.context(), cmd.svmPointers()[idx]);
    }
  }

  cmd.setStatus(CL_COMPLETE);
}
|
|
|
|
//! Copies SVM memory by issuing a memFill of the source, as a pattern of srcSize bytes
//! repeated once, into the destination.
void VirtualCPU::submitSvmCopyMemory(amd::SvmCopyMemoryCommand& cmd) {
  cmd.setStatus(CL_RUNNING);

  // A single repetition of the whole source region.
  amd::SvmBuffer::memFill(cmd.dst(), cmd.src(), cmd.srcSize(), 1);

  cmd.setStatus(CL_COMPLETE);
}
|
|
|
|
//! Fills SVM memory by passing the command's pattern, pattern size and repetition count
//! to amd::SvmBuffer::memFill().
void VirtualCPU::submitSvmFillMemory(amd::SvmFillMemoryCommand& cmd) {
  cmd.setStatus(CL_RUNNING);

  amd::SvmBuffer::memFill(cmd.dst(), cmd.pattern(), cmd.patternSize(), cmd.times());

  cmd.setStatus(CL_COMPLETE);
}
|
|
|
|
//! No work is done for an SVM map here; the command is completed immediately.
void VirtualCPU::submitSvmMapMemory(amd::SvmMapMemoryCommand& cmd) {
  cmd.setStatus(CL_COMPLETE);
}
|
|
|
|
//! No work is done for an SVM unmap here; the command is completed immediately.
void VirtualCPU::submitSvmUnmapMemory(amd::SvmUnmapMemoryCommand& cmd) {
  cmd.setStatus(CL_COMPLETE);
}
|
|
|
|
} // namespace cpu
|