465c1c0287
SWDEV-102733 - [OCL-LC-ROCm] Cmake build Write CMakeLists.txt to enable building with and without the DK environment - Change the coding convention of the runtime files. Use Google's Style (https://google.github.io/styleguide/cppguide.html). Affected files ... ... //depot/stg/opencl/drivers/opencl/.clang-format#1 add ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_agent_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_command.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_context.cpp#53 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_counter.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_d3d10.cpp#15 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_d3d11.cpp#22 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_d3d9.cpp#32 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_debugger_amd.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_debugger_amd.h#7 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_device.cpp#61 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_event.cpp#10 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_execute.cpp#23 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_gl.cpp#53 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_icd.cpp#27 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_icd_amd.h#18 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_kernel.h#24 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_kernel_info_amd.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_kernel_info_amd.h#4 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_lqdflash_amd.cpp#17 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_lqdflash_amd.h#6 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_memobj.cpp#81 edit ... 
//depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_object.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_pipe.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_platform_amd.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_platform_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_profile_amd.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_profile_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_program.cpp#41 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_sampler.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_sdi_amd.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_sdi_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_semaphore_amd.h#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_svm.cpp#20 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_thread_trace_amd.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_thread_trace_amd.h#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/appprofile.cpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/appprofile.hpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/blit.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/blit.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/blitcl.cpp#11 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpubinary.cpp#11 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpubinary.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpubuiltins.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpubuiltins.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpucommand.cpp#66 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpucommand.hpp#40 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpudevice.cpp#280 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpudevice.hpp#96 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpufeat.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpukernel.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpumapping.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpumapping.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpuprogram.cpp#70 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpuprogram.hpp#14 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpusettings.cpp#33 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpusettings.hpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cputables.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpuvirtual.cpp#26 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/cpu/cpuvirtual.hpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/device.cpp#209 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/device.hpp#284 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuappprofile.cpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuappprofile.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpubinary.cpp#58 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpubinary.hpp#27 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpublit.cpp#126 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpublit.hpp#41 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpucompiler.cpp#156 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuconstbuf.cpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuconstbuf.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpucounters.cpp#12 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpucounters.hpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudebugger.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudebugmanager.cpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudebugmanager.hpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudefs.hpp#147 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudevice.cpp#567 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpudevice.hpp#163 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpukernel.cpp#318 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpukernel.hpp#126 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpumemory.cpp#131 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpumemory.hpp#50 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuprintf.cpp#44 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuprintf.hpp#15 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuprogram.cpp#232 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuprogram.hpp#69 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuresource.cpp#238 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuresource.hpp#87 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpusched.hpp#19 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuschedcl.cpp#35 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuscsi.cpp#37 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpusettings.cpp#350 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpusettings.hpp#98 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputhreadtrace.cpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputhreadtrace.hpp#7 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputimestamp.cpp#27 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputimestamp.hpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gputrap.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuvirtual.cpp#410 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuvirtual.hpp#140 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuwavelimiter.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/gpu/gpuwavelimiter.hpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/hwdebug.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/hwdebug.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palappprofile.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palappprofile.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palbinary.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palbinary.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palblit.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palblit.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palcompiler.cpp#15 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palconstbuf.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palconstbuf.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palcounters.cpp#11 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palcounters.hpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldebugger.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldebugmanager.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldebugmanager.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldefs.hpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldevice.cpp#45 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/pal/paldevice.hpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d10.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d11.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d9.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldevicegl.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palkernel.cpp#34 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palkernel.hpp#11 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palmemory.cpp#13 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palmemory.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palprintf.cpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palprintf.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palprogram.cpp#39 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palprogram.hpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palresource.cpp#28 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palresource.hpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palsched.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palschedcl.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palsettings.cpp#24 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palsettings.hpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palthreadtrace.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palthreadtrace.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paltimestamp.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paltimestamp.hpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paltrap.hpp#2 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/pal/palvirtual.cpp#48 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palvirtual.hpp#21 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palwavelimiter.cpp#3 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palwavelimiter.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/mesa_glinterop.h#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocappprofile.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocappprofile.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocbinary.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocblit.cpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocblit.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/roccompiler.cpp#32 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/roccompilerlib.cpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/roccompilerlib.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdefs.hpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdevice.cpp#48 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdevice.hpp#20 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocglinterop.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocglinterop.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rockernel.cpp#22 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rockernel.hpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocmemory.cpp#15 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocmemory.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprintf.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprintf.hpp#5 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprogram.cpp#64 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprogram.hpp#23 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocregisters.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocsettings.cpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocsettings.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocvirtual.cpp#34 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocvirtual.hpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/alloc.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/alloc.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os.hpp#30 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os_posix.cpp#42 edit ... //depot/stg/opencl/drivers/opencl/runtime/os/os_win32.cpp#47 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/agent.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/agent.hpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/command.cpp#78 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/command.hpp#83 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/commandqueue.cpp#23 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/commandqueue.hpp#18 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/context.cpp#42 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/context.hpp#26 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/counter.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/interop.hpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/kernel.cpp#23 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/kernel.hpp#18 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/memory.cpp#127 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/platform/memory.hpp#100 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/ndrange.cpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/ndrange.hpp#9 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/object.cpp#2 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/object.hpp#17 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/perfctr.hpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/program.cpp#86 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/program.hpp#41 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/runtime.cpp#35 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/runtime.hpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/sampler.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/platform/threadtrace.hpp#6 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/atomic.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/monitor.cpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/monitor.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/semaphore.cpp#10 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/semaphore.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/thread.cpp#14 edit ... //depot/stg/opencl/drivers/opencl/runtime/thread/thread.hpp#15 edit ... //depot/stg/opencl/drivers/opencl/runtime/top.hpp#26 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/concurrent.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/debug.cpp#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/debug.hpp#7 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/flags.cpp#16 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/flags.hpp#271 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/macros.hpp#8 edit ... //depot/stg/opencl/drivers/opencl/runtime/utils/util.hpp#12 edit ... 
//depot/stg/opencl/drivers/opencl/runtime/utils/versions.hpp#2150 edit
578 строки
21 KiB
C++
578 строки
21 KiB
C++
//
|
|
// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
|
|
#ifndef GPUPROGRAM_HPP_
|
|
#define GPUPROGRAM_HPP_
|
|
|
|
#include "device/gpu/gpukernel.hpp"
|
|
#include "device/gpu/gpubinary.hpp"
|
|
#include "amd_hsa_loader.hpp"
|
|
|
|
// Forward declarations of the amd:: types this header only refers to by
// pointer or reference (the full definitions live in other headers).
namespace amd {
namespace option {
class Options;
}  // namespace option
namespace hsa {
namespace loader {
class Loader;
class Executable;
class Context;
}  // namespace loader
}  // namespace hsa
}  // namespace amd

//! \namespace gpu GPU Device Implementation
|
|
namespace gpu {
|
|
|
|
/*! \addtogroup GPU GPU Device Implementation
|
|
* @{
|
|
*/
|
|
|
|
//! \struct ILFunc for the opencl program processing
|
|
struct ILFunc : public amd::HeapObject {
|
|
public:
|
|
//! \struct CodeRange for the code ranges
|
|
struct SourceRange : public amd::EmbeddedObject {
|
|
size_t begin_; //!< start code position
|
|
size_t end_; //!< end code position
|
|
};
|
|
|
|
//! \enum IL function state
|
|
enum State {
|
|
Unknown = 0x00000000, //! unknown function
|
|
Regular = 0x00000001, //! regular function from the program
|
|
Kernel = 0x00000002 //! kernel function from the program
|
|
};
|
|
|
|
//! Default constructor
|
|
ILFunc()
|
|
: name_(""),
|
|
index_(0),
|
|
state_(Unknown),
|
|
privateSize_(0),
|
|
localSize_(0),
|
|
hwPrivateSize_(0),
|
|
hwLocalSize_(0),
|
|
flags_(0),
|
|
totalHwPrivateSize_(-1) {
|
|
code_.begin_ = code_.end_ = 0;
|
|
metadata_.begin_ = metadata_.end_ = 0;
|
|
}
|
|
|
|
//! Copy constructor
|
|
ILFunc(const ILFunc& func) { *this = func; }
|
|
|
|
//! Destructor
|
|
~ILFunc() {}
|
|
|
|
//! Overloads operator=
|
|
ILFunc& operator=(const ILFunc& func) {
|
|
name_ = func.name_;
|
|
index_ = func.index_;
|
|
code_ = func.code_;
|
|
metadata_ = func.metadata_;
|
|
state_ = func.state_;
|
|
privateSize_ = func.privateSize_;
|
|
localSize_ = func.localSize_;
|
|
hwPrivateSize_ = func.hwPrivateSize_;
|
|
hwLocalSize_ = func.hwLocalSize_;
|
|
flags_ = func.flags_;
|
|
totalHwPrivateSize_ = func.totalHwPrivateSize_;
|
|
|
|
// Note: we don't copy calls_ and macros_
|
|
return *this;
|
|
}
|
|
|
|
std::string name_; //!< kernel's name
|
|
uint index_; //!< kernel's index
|
|
SourceRange code_; //!< the entire function range in the source
|
|
SourceRange metadata_; //!< the metadata range
|
|
State state_; //!< the function is real, and not intrinsic
|
|
uint privateSize_; //!< private ring allocation by the function
|
|
uint localSize_; //!< local ring allocation by the function
|
|
uint hwPrivateSize_; //!< HW private ring allocation by the function
|
|
uint hwLocalSize_; //!< HW local ring allocation by the function
|
|
uint flags_; //!< The IL func flags/properties
|
|
long long totalHwPrivateSize_; //!< total HW private usage including called functions
|
|
std::vector<ILFunc*> calls_; //! Functions called from the current
|
|
std::vector<uint> macros_; //! Macros, used in the IL function
|
|
|
|
uint totalHwPrivateUsage(); //!< total HW private usage including called functions
|
|
};
|
|
|
|
//! \class empty program
|
|
class NullProgram : public device::Program {
|
|
friend class ClBinary;
|
|
|
|
public:
|
|
//! Default constructor
|
|
NullProgram(NullDevice& nullDev) : device::Program(nullDev), patch_(0) {}
|
|
|
|
//! Default destructor
|
|
~NullProgram();
|
|
|
|
// Initialize Binary for GPU
|
|
virtual bool initClBinary();
|
|
// Release Binary for GPU
|
|
virtual void releaseClBinary();
|
|
|
|
//! Returns global constant buffers
|
|
const std::vector<uint>& glbCb() const { return glbCb_; }
|
|
|
|
protected:
|
|
//! pre-compile setup for GPU
|
|
virtual bool initBuild(amd::option::Options* options);
|
|
|
|
//! post-compile setup for GPU
|
|
virtual bool finiBuild(bool isBuildGood);
|
|
|
|
/*! \brief Compiles GPU CL program to LLVM binary (compiler frontend)
|
|
*
|
|
* \return True if we successefully compiled a GPU program
|
|
*/
|
|
virtual bool compileImpl(const std::string& sourceCode, //!< the program's source code
|
|
const std::vector<const std::string*>& headers, //!< header souce codes
|
|
const char** headerIncludeNames, //!< include names of headers
|
|
amd::option::Options* options //!< compile options's object
|
|
);
|
|
|
|
/*! \brief Compiles LLVM binary to IL code (compiler backend: link+opt+codegen)
|
|
*
|
|
* \return The build error code
|
|
*/
|
|
int compileBinaryToIL(amd::option::Options* options //!< options for compilation
|
|
);
|
|
|
|
/*! \brief Links the compiled IL program with HW
|
|
*
|
|
* \return True if we successefully linked a GPU program
|
|
*/
|
|
virtual bool linkImpl(amd::option::Options* options = NULL //!< options object
|
|
);
|
|
virtual bool linkImpl(const std::vector<device::Program*>& inputPrograms,
|
|
amd::option::Options* options = NULL, //!< options object
|
|
bool createLibrary = false);
|
|
|
|
virtual bool createBinary(amd::option::Options* options);
|
|
|
|
|
|
/*! \brief Parses the GPU program and finds all available kernels
|
|
*
|
|
* \return True if we successefully parsed the GPU program
|
|
*/
|
|
bool parseKernels(const std::string& source //! the program's source code
|
|
);
|
|
|
|
/*! \brief Parse all functions in the program
|
|
*
|
|
* \return True if we successefully parsed all functions
|
|
*/
|
|
bool parseAllILFuncs(const std::string& source //! the program's source code
|
|
);
|
|
|
|
/*! \brief Parse a function's metadata given as source[posBegin:posEnd-1]
|
|
*
|
|
* \return True if we successefully parsed the given metadata
|
|
*/
|
|
bool parseFuncMetadata(const std::string& source, //! string that contains metadata
|
|
size_t posBegin, //! begin of metadata in 'source'
|
|
size_t posEnd //! end of metadata in 'source'
|
|
);
|
|
|
|
/*! \brief Finds functions with the given start and end string in the
|
|
* program
|
|
*
|
|
* \return True if we successefully found all functions
|
|
*/
|
|
bool findILFuncs(const std::string& source, //! the program's source code
|
|
const std::string& func_start, //! the start string of a function
|
|
const std::string& func_end, //! the end string of a function
|
|
size_t& lastFuncPos //! pos to the end of the last func in 'source'
|
|
);
|
|
|
|
|
|
/*! \brief Finds all functions in the program
|
|
*
|
|
* \return True if we successefully found all functions
|
|
*/
|
|
bool findAllILFuncs(const std::string& source, //! the program's source code
|
|
size_t& lastFuncPos //! pos to the end of the last func in 'source'
|
|
);
|
|
|
|
/*! \brief Finds function, corresponded to the provided unique index
|
|
*
|
|
* \return Pointer to the ILFunc structure
|
|
*/
|
|
ILFunc* findILFunc(uint index //! the function unique index
|
|
);
|
|
|
|
//! Destroys all objects, associated with the IL functions
|
|
void freeAllILFuncs();
|
|
|
|
/*! \brief Finds if a provided function is called from the base function
|
|
*
|
|
* \return True if a function is used from the base one
|
|
*/
|
|
bool isCalled(const ILFunc* base, //!< The base function
|
|
const ILFunc* func //!< Function to check for usage
|
|
);
|
|
|
|
//! Patches the "main" function with the call to the current kernel
|
|
void patchMain(std::string& kernel, //! The current kernel's code for compilation
|
|
uint index //! Index of the current kernel in the program
|
|
);
|
|
|
|
//! Adds the IL function object into the list of functions
|
|
void addFunc(ILFunc* func) { funcs_.push_back(func); }
|
|
|
|
//! Empty implementation, since we don't have real HW
|
|
virtual bool allocGlobalData(const void* globalData, //!< Pointer to the global data
|
|
size_t dataSize, //!< The global data size
|
|
uint index //!< Index for the global data store (0 - global heap)
|
|
) {
|
|
glbCb_.push_back(index);
|
|
return true;
|
|
}
|
|
|
|
//! Load binary for offline device.
|
|
virtual bool loadBinary(bool* hasRecompiled);
|
|
|
|
//! Create NullKernel for compiling to isa.
|
|
virtual NullKernel* createKernel(const std::string& name, //!< The kernel's name
|
|
const Kernel::InitData* initData, //!< Initialization data
|
|
const std::string& code, //!< IL source code
|
|
const std::string& metadata, //!< the kernel metadata structure
|
|
bool* created, //!< True if the object was created
|
|
const void* binaryCode = NULL, //!< binary machine code for CAL
|
|
size_t binarySize = 0 //!< the machine code size
|
|
);
|
|
|
|
ClBinary* clBinary() { return static_cast<ClBinary*>(device::Program::clBinary()); }
|
|
const ClBinary* clBinary() const {
|
|
return static_cast<const ClBinary*>(device::Program::clBinary());
|
|
}
|
|
|
|
/*! Get all per-kernel IL from programIL, where programIL is the IL for the
|
|
* whole compilation unit.
|
|
*/
|
|
bool getAllKernelILs(std::map<std::string, std::string>& allKernelILs, std::string& programIL,
|
|
const char* ilKernelName);
|
|
|
|
protected:
|
|
std::vector<PrintfInfo> printf_; //!< Format strings for GPU printf support
|
|
std::vector<uint> glbCb_; //!< Global constant buffers
|
|
|
|
virtual bool isElf(const char* bin) const { return amd::isElfMagic(bin); }
|
|
|
|
virtual const aclTargetInfo& info(const char* str = "");
|
|
|
|
private:
|
|
//! Disable default copy constructor
|
|
NullProgram(const NullProgram&);
|
|
|
|
//! Disable operator=
|
|
NullProgram& operator=(const NullProgram&);
|
|
|
|
//! Initializes the global data store
|
|
bool initGlobalData(const std::string& source, //!< the program's source code
|
|
size_t start //!< start position for the global data search
|
|
);
|
|
|
|
//! Return a typecasted GPU device
|
|
gpu::NullDevice& dev() {
|
|
return const_cast<gpu::NullDevice&>(static_cast<const gpu::NullDevice&>(device()));
|
|
}
|
|
|
|
size_t patch_; //!< Patch call position in the source code.
|
|
std::vector<ILFunc*> funcs_; //!< list of all functions.
|
|
|
|
std::string ilProgram_; //!< IL program after compilation
|
|
};
|
|
|
|
//! \class GPU program
|
|
class Program : public NullProgram {
|
|
public:
|
|
//! GPU program constructor
|
|
Program(Device& gpuDev) : NullProgram(gpuDev), glbData_(NULL) {}
|
|
|
|
//! GPU program destructor
|
|
~Program();
|
|
|
|
//! Get the global data store for this program
|
|
gpu::Memory* glbData() const { return glbData_; }
|
|
|
|
//! Returns TRUE if we successfully allocated the global data store
|
|
//! in video memory
|
|
bool allocGlobalData(const void* globalData, //!< Pointer to the global data
|
|
size_t dataSize, //!< The global data size
|
|
uint index //!< Index for the global data store (0 - global heap)
|
|
);
|
|
|
|
//! Returns TRUE if we could
|
|
virtual bool loadBinary(bool* hasRecompiled);
|
|
|
|
//! Creates the GPU kernel (return base type)
|
|
virtual NullKernel* createKernel(const std::string& name, //!< The kernel's name
|
|
const Kernel::InitData* initData, //!< Initialization data
|
|
const std::string& code, //!< IL source code
|
|
const std::string& metadata, //!< the kernel metadata structure
|
|
bool* created, //!< True if the object was created
|
|
const void* binaryCode = NULL, //!< binary machine code for CAL
|
|
size_t binarySize = 0 //!< the machine code size
|
|
);
|
|
|
|
typedef std::map<uint, gpu::Memory*> HwConstBuffers;
|
|
|
|
//! Global HW constant buffers
|
|
const HwConstBuffers& glbHwCb() const { return constBufs_; }
|
|
|
|
//! Returns pritnf info array
|
|
const std::vector<PrintfInfo>& printfInfo() const { return printf_; }
|
|
|
|
//! Return a typecasted GPU device
|
|
gpu::Device& dev() { return const_cast<gpu::Device&>(static_cast<const gpu::Device&>(device())); }
|
|
|
|
protected:
|
|
private:
|
|
//! Disable copy constructor
|
|
Program(const Program&);
|
|
|
|
//! Disable operator=
|
|
Program& operator=(const Program&);
|
|
|
|
HwConstBuffers constBufs_; //!< Constant buffers for the global store
|
|
gpu::Memory* glbData_; //!< Global data store
|
|
};
|
|
|
|
// NOTE(review): a using-directive in a header exposes the amd::hsa::loader
// names to every file that includes it; it is kept because code in this
// header refers to the loader's `Context` type unqualified.
using namespace amd::hsa::loader;

//! Forward declaration of the HSAIL program class
class HSAILProgram;

class ORCAHSALoaderContext final : public Context {
|
|
public:
|
|
ORCAHSALoaderContext(HSAILProgram* program) : program_(program) {}
|
|
|
|
virtual ~ORCAHSALoaderContext() {}
|
|
|
|
hsa_isa_t IsaFromName(const char* name) override;
|
|
|
|
bool IsaSupportedByAgent(hsa_agent_t agent, hsa_isa_t isa) override;
|
|
|
|
void* SegmentAlloc(amdgpu_hsa_elf_segment_t segment, hsa_agent_t agent, size_t size, size_t align,
|
|
bool zero) override;
|
|
|
|
bool SegmentCopy(amdgpu_hsa_elf_segment_t segment, hsa_agent_t agent, void* dst, size_t offset,
|
|
const void* src, size_t size) override;
|
|
|
|
void SegmentFree(amdgpu_hsa_elf_segment_t segment, hsa_agent_t agent, void* seg,
|
|
size_t size = 0) override;
|
|
|
|
void* SegmentAddress(amdgpu_hsa_elf_segment_t segment, hsa_agent_t agent, void* seg,
|
|
size_t offset) override;
|
|
|
|
void* SegmentHostAddress(amdgpu_hsa_elf_segment_t segment, hsa_agent_t agent, void* seg,
|
|
size_t offset) override {
|
|
return nullptr;
|
|
}
|
|
|
|
bool SegmentFreeze(amdgpu_hsa_elf_segment_t segment, hsa_agent_t agent, void* seg,
|
|
size_t size) override {
|
|
return false;
|
|
}
|
|
|
|
bool ImageExtensionSupported() override { return false; }
|
|
|
|
hsa_status_t ImageCreate(hsa_agent_t agent, hsa_access_permission_t image_permission,
|
|
const hsa_ext_image_descriptor_t* image_descriptor,
|
|
const void* image_data, hsa_ext_image_t* image_handle) override {
|
|
// not supported
|
|
assert(false);
|
|
return HSA_STATUS_ERROR;
|
|
}
|
|
|
|
hsa_status_t ImageDestroy(hsa_agent_t agent, hsa_ext_image_t image_handle) override {
|
|
// not supported
|
|
assert(false);
|
|
return HSA_STATUS_ERROR;
|
|
}
|
|
|
|
hsa_status_t SamplerCreate(hsa_agent_t agent,
|
|
const hsa_ext_sampler_descriptor_t* sampler_descriptor,
|
|
hsa_ext_sampler_t* sampler_handle) override;
|
|
|
|
//! All samplers are owned by HSAILProgram and are deleted in its destructor.
|
|
hsa_status_t SamplerDestroy(hsa_agent_t agent, hsa_ext_sampler_t sampler_handle) override;
|
|
|
|
private:
|
|
void* AgentGlobalAlloc(hsa_agent_t agent, size_t size, size_t align, bool zero) {
|
|
return GpuMemAlloc(size, align, zero);
|
|
}
|
|
|
|
bool AgentGlobalCopy(void* dst, size_t offset, const void* src, size_t size) {
|
|
return GpuMemCopy(dst, offset, src, size);
|
|
}
|
|
|
|
//! Releases agent-global storage by forwarding \p ptr and \p size to GpuMemFree.
void AgentGlobalFree(void* ptr, size_t size) {
  GpuMemFree(ptr, size);
}
|
|
|
|
//! Allocates kernel-code storage by forwarding to CpuMemAlloc.
//! \p agent is not used; \p size, \p align and \p zero are passed through unchanged.
//! \return Whatever CpuMemAlloc returns.
void* KernelCodeAlloc(hsa_agent_t agent, size_t size, size_t align, bool zero) {
  void* const allocation = CpuMemAlloc(size, align, zero);
  return allocation;
}
|
|
|
|
bool KernelCodeCopy(void* dst, size_t offset, const void* src, size_t size) {
|
|
return CpuMemCopy(dst, offset, src, size);
|
|
}
|
|
|
|
//! Releases kernel-code storage by forwarding \p ptr and \p size to CpuMemFree.
void KernelCodeFree(void* ptr, size_t size) {
  CpuMemFree(ptr, size);
}
|
|
|
|
//! Host-side allocation helper used by KernelCodeAlloc; defined out of line.
//! NOTE(review): presumably returns \p size bytes aligned to \p align, cleared when
//! \p zero is set, and released with CpuMemFree - confirm against the definition.
void* CpuMemAlloc(size_t size, size_t align, bool zero);
|
|
|
|
//! Host-side copy helper used by KernelCodeCopy; defined out of line.
//! NOTE(review): presumably copies \p size bytes from \p src to \p dst + \p offset -
//! confirm against the definition.
bool CpuMemCopy(void* dst, size_t offset, const void* src, size_t size);
|
|
|
|
//! Releases host-side memory through amd::Os::alignedFree.
//! \p size is accepted but not used.
void CpuMemFree(void* ptr, size_t size) {
  amd::Os::alignedFree(ptr);
}
|
|
|
|
//! Device-side allocation helper used by AgentGlobalAlloc; defined out of line.
//! NOTE(review): the meaning of the returned pointer (raw address vs. memory-object
//! handle) is not visible here - confirm against the definition.
void* GpuMemAlloc(size_t size, size_t align, bool zero);
|
|
|
|
//! Device-side copy helper used by AgentGlobalCopy; defined out of line.
//! NOTE(review): presumably uploads \p size bytes from \p src into \p dst at \p offset -
//! confirm against the definition.
bool GpuMemCopy(void* dst, size_t offset, const void* src, size_t size);
|
|
|
|
//! Device-side release helper used by AgentGlobalFree; defined out of line.
//! \p size defaults to 0 when the caller omits it.
void GpuMemFree(void* ptr, size_t size = 0);
|
|
|
|
ORCAHSALoaderContext(const ORCAHSALoaderContext& c);
|
|
|
|
//! Copy assignment is disabled. Explicitly deleting the operator (rather than leaving a
//! private declaration without a definition) turns an accidental assignment from inside
//! the class into a compile-time error instead of an unresolved symbol at link time.
ORCAHSALoaderContext& operator=(const ORCAHSALoaderContext& c) = delete;
|
|
|
|
//! HSAIL program this loader context is attached to.
//! NOTE(review): presumably a non-owning back-pointer - confirm against the constructor.
gpu::HSAILProgram* program_;
|
|
};
|
|
|
|
//! \class HSAIL program
|
|
class HSAILProgram : public device::Program {
|
|
friend class ClBinary;
|
|
|
|
public:
|
|
//! Default constructor
|
|
HSAILProgram(Device& device);
|
|
HSAILProgram(NullDevice& device);
|
|
//! Default destructor
|
|
~HSAILProgram();
|
|
|
|
//! Returns the aclBinary associated with the progrm
|
|
aclBinary* binaryElf() const { return static_cast<aclBinary*>(binaryElf_); }
|
|
|
|
void addGlobalStore(Memory* mem) { globalStores_.push_back(mem); }
|
|
|
|
const std::vector<Memory*>& globalStores() const { return globalStores_; }
|
|
|
|
//! Return a typecasted GPU device
|
|
gpu::Device& dev() { return const_cast<gpu::Device&>(static_cast<const gpu::Device&>(device())); }
|
|
|
|
//! Returns GPU kernel table
|
|
const Memory* kernelTable() const { return kernels_; }
|
|
|
|
//! Adds all kernels to the mem handle lists
|
|
void fillResListWithKernels(std::vector<const Memory*>& memList) const;
|
|
|
|
//! Returns the maximum number of scratch regs used in the program
|
|
uint maxScratchRegs() const { return maxScratchRegs_; }
|
|
|
|
//! Add internal static sampler
|
|
void addSampler(Sampler* sampler) { staticSamplers_.push_back(sampler); }
|
|
|
|
//! Returns TRUE if the program just compiled
|
|
bool isNull() const { return isNull_; }
|
|
|
|
//! Returns TRUE if the program contains static samplers
|
|
bool isStaticSampler() const { return (staticSamplers_.size() != 0); }
|
|
|
|
protected:
|
|
//! pre-compile setup for GPU
|
|
virtual bool initBuild(amd::option::Options* options);
|
|
|
|
//! post-compile setup for GPU
|
|
virtual bool finiBuild(bool isBuildGood);
|
|
|
|
/*! \brief Compiles GPU CL program to LLVM binary (compiler frontend)
|
|
*
|
|
* \return True if we successefully compiled a GPU program
|
|
*/
|
|
virtual bool compileImpl(const std::string& sourceCode, //!< the program's source code
|
|
const std::vector<const std::string*>& headers,
|
|
const char** headerIncludeNames,
|
|
amd::option::Options* options //!< compile options's object
|
|
);
|
|
|
|
/* \brief Returns the next stage to compile from, based on sections in binary,
|
|
* also returns completeStages in a vector, which contains at least ACL_TYPE_DEFAULT,
|
|
* sets needOptionsCheck to true if options check is needed to decide whether or not to recompile
|
|
*/
|
|
aclType getCompilationStagesFromBinary(std::vector<aclType>& completeStages,
|
|
bool& needOptionsCheck);
|
|
|
|
/* \brief Returns the next stage to compile from, based on sections and options in binary
|
|
*/
|
|
aclType getNextCompilationStageFromBinary(amd::option::Options* options);
|
|
|
|
bool saveBinaryAndSetType(type_t type);
|
|
|
|
virtual bool linkImpl(amd::option::Options* options);
|
|
|
|
//! Link the device programs.
|
|
virtual bool linkImpl(const std::vector<device::Program*>& inputPrograms,
|
|
amd::option::Options* options, bool createLibrary);
|
|
|
|
virtual bool createBinary(amd::option::Options* options);
|
|
|
|
//! Initialize Binary
|
|
virtual bool initClBinary();
|
|
|
|
//! Release the Binary
|
|
virtual void releaseClBinary();
|
|
|
|
virtual const aclTargetInfo& info(const char* str = "");
|
|
|
|
virtual bool isElf(const char* bin) const {
|
|
return amd::isElfMagic(bin);
|
|
// return false;
|
|
}
|
|
|
|
//! Returns the binary
|
|
// This should ensure that the binary is updated with all the kernels
|
|
// ClBinary& clBinary() { return binary_; }
|
|
ClBinary* clBinary() { return static_cast<ClBinary*>(device::Program::clBinary()); }
|
|
const ClBinary* clBinary() const {
|
|
return static_cast<const ClBinary*>(device::Program::clBinary());
|
|
}
|
|
|
|
private:
|
|
//! Disable default copy constructor
|
|
HSAILProgram(const HSAILProgram&);
|
|
|
|
//! Disable operator=
|
|
HSAILProgram& operator=(const HSAILProgram&);
|
|
|
|
//! Returns all the options to be appended while passing to the
|
|
// compiler library
|
|
std::string hsailOptions();
|
|
|
|
//! Allocate kernel table
|
|
bool allocKernelTable();
|
|
|
|
std::string openCLSource_; //!< Original OpenCL source
|
|
std::string HSAILProgram_; //!< FSAIL program after compilation
|
|
std::string llvmBinary_; //!< LLVM IR binary code
|
|
aclBinary* binaryElf_; //!< Binary for the new compiler library
|
|
void* rawBinary_; //!< Pointer to the raw binary
|
|
aclBinaryOptions binOpts_; //!< Binary options to create aclBinary
|
|
std::vector<Memory*> globalStores_; //!< Global memory for the program
|
|
Memory* kernels_; //!< Table with kernel object pointers
|
|
uint
|
|
maxScratchRegs_; //!< Maximum number of scratch regs used in the program by individual kernel
|
|
std::list<Sampler*> staticSamplers_; //!< List od internal static samplers
|
|
bool isNull_; //!< Null program no memory allocations
|
|
amd::hsa::loader::Loader* loader_; //!< Loader object
|
|
amd::hsa::loader::Executable* executable_; //!< Executable for HSA Loader
|
|
ORCAHSALoaderContext loaderContext_; //!< Context for HSA Loader
|
|
};
|
|
|
|
/*@}*/} // namespace gpu
|
|
|
|
#endif /*GPUPROGRAM_HPP_*/
|