From 3694ab2ce84ce836530bad5ea73d133513bcde76 Mon Sep 17 00:00:00 2001
From: foreman
Date: Fri, 4 Jul 2014 16:17:05 -0400
Subject: [PATCH] initial commit
---
rocclr/compiler/lib/Doxyfile | 1606 +++++++
rocclr/compiler/lib/amdoclcl.def.in | 99 +
rocclr/compiler/lib/amdoclcl.map.in | 104 +
rocclr/compiler/lib/amdoclcl.rc | 75 +
.../compiler/lib/backends/common/backend.hpp | 33 +
.../compiler/lib/backends/common/codegen.cpp | 367 ++
.../compiler/lib/backends/common/codegen.hpp | 87 +
.../lib/backends/common/compiler_stage.cpp | 99 +
.../lib/backends/common/compiler_stage.hpp | 96 +
.../compiler/lib/backends/common/frontend.cpp | 295 ++
.../compiler/lib/backends/common/frontend.hpp | 99 +
.../lib/backends/common/frontend_clang.cpp | 202 +
rocclr/compiler/lib/backends/common/if_acl.h | 15 +
.../compiler/lib/backends/common/library.cpp | 290 ++
.../compiler/lib/backends/common/library.hpp | 59 +
.../compiler/lib/backends/common/linker.cpp | 1299 ++++++
.../compiler/lib/backends/common/linker.hpp | 103 +
.../lib/backends/common/opt_level.cpp | 186 +
.../lib/backends/common/opt_level.hpp | 188 +
.../lib/backends/common/optimizer.cpp | 152 +
.../lib/backends/common/optimizer.hpp | 106 +
rocclr/compiler/lib/backends/common/spir.cpp | 138 +
rocclr/compiler/lib/backends/common/spir.hpp | 40 +
.../lib/backends/common/v0_8/if_acl.cpp | 2736 +++++++++++
.../lib/backends/common/v0_8/if_acl.h | 129 +
rocclr/compiler/lib/complibdefs | 84 +
rocclr/compiler/lib/complibrules | 16 +
rocclr/compiler/lib/include/acl.h | 17 +
rocclr/compiler/lib/include/aclDefs.h | 16 +
rocclr/compiler/lib/include/aclEnums.h | 16 +
rocclr/compiler/lib/include/aclFunctors.h | 16 +
rocclr/compiler/lib/include/aclStructs.h | 16 +
rocclr/compiler/lib/include/aclTypes.h | 17 +
rocclr/compiler/lib/include/v0_8/acl.h | 250 +
rocclr/compiler/lib/include/v0_8/aclDefs.h | 35 +
rocclr/compiler/lib/include/v0_8/aclEnums.h | 318 ++
.../compiler/lib/include/v0_8/aclFunctors.h | 182 +
rocclr/compiler/lib/include/v0_8/aclStructs.h | 305 ++
rocclr/compiler/lib/include/v0_8/aclTypes.h | 88 +
rocclr/compiler/lib/loaders/elf/elf.cpp | 1548 +++++++
rocclr/compiler/lib/loaders/elf/elf.hpp | 399 ++
rocclr/compiler/lib/loaders/elf/elf_utils.cpp | 302 ++
rocclr/compiler/lib/loaders/elf/elf_utils.hpp | 145 +
.../lib/loaders/elf/utils/common/_elftc.h | 542 +++
.../loaders/elf/utils/common/elfdefinitions.h | 2618 +++++++++++
.../elf/utils/common/native-elf-format | 47 +
.../elf/utils/common/native-elf-format.h | 7 +
.../lib/loaders/elf/utils/common/uthash.h | 906 ++++
.../lib/loaders/elf/utils/libelf/README | 12 +
.../lib/loaders/elf/utils/libelf/README.build | 64 +
.../lib/loaders/elf/utils/libelf/Version.map | 97 +
.../lib/loaders/elf/utils/libelf/_libelf.h | 217 +
.../lib/loaders/elf/utils/libelf/_libelf_ar.h | 56 +
.../loaders/elf/utils/libelf/_libelf_config.h | 218 +
.../lib/loaders/elf/utils/libelf/elf.c | 41 +
.../lib/loaders/elf/utils/libelf/elf_begin.c | 337 ++
.../lib/loaders/elf/utils/libelf/elf_cntl.c | 58 +
.../lib/loaders/elf/utils/libelf/elf_data.c | 254 ++
.../lib/loaders/elf/utils/libelf/elf_end.c | 99 +
.../lib/loaders/elf/utils/libelf/elf_errmsg.c | 88 +
.../lib/loaders/elf/utils/libelf/elf_errno.c | 43 +
.../lib/loaders/elf/utils/libelf/elf_fill.c | 39 +
.../lib/loaders/elf/utils/libelf/elf_flag.c | 195 +
.../loaders/elf/utils/libelf/elf_getarhdr.c | 47 +
.../loaders/elf/utils/libelf/elf_getarsym.c | 58 +
.../loaders/elf/utils/libelf/elf_getbase.c | 48 +
.../loaders/elf/utils/libelf/elf_getident.c | 68 +
.../lib/loaders/elf/utils/libelf/elf_hash.c | 56 +
.../lib/loaders/elf/utils/libelf/elf_kind.c | 44 +
.../lib/loaders/elf/utils/libelf/elf_memory.c | 92 +
.../lib/loaders/elf/utils/libelf/elf_next.c | 62 +
.../lib/loaders/elf/utils/libelf/elf_phnum.c | 67 +
.../lib/loaders/elf/utils/libelf/elf_rand.c | 59 +
.../loaders/elf/utils/libelf/elf_rawfile.c | 53 +
.../lib/loaders/elf/utils/libelf/elf_scn.c | 251 +
.../lib/loaders/elf/utils/libelf/elf_shnum.c | 67 +
.../loaders/elf/utils/libelf/elf_shstrndx.c | 82 +
.../lib/loaders/elf/utils/libelf/elf_strptr.c | 134 +
.../lib/loaders/elf/utils/libelf/elf_update.c | 1263 +++++
.../loaders/elf/utils/libelf/elf_version.c | 52 +
.../lib/loaders/elf/utils/libelf/gelf.h | 114 +
.../lib/loaders/elf/utils/libelf/gelf_cap.c | 148 +
.../loaders/elf/utils/libelf/gelf_checksum.c | 58 +
.../lib/loaders/elf/utils/libelf/gelf_dyn.c | 143 +
.../lib/loaders/elf/utils/libelf/gelf_ehdr.c | 167 +
.../lib/loaders/elf/utils/libelf/gelf_fsize.c | 62 +
.../loaders/elf/utils/libelf/gelf_getclass.c | 39 +
.../lib/loaders/elf/utils/libelf/gelf_move.c | 154 +
.../lib/loaders/elf/utils/libelf/gelf_phdr.c | 177 +
.../lib/loaders/elf/utils/libelf/gelf_rel.c | 152 +
.../lib/loaders/elf/utils/libelf/gelf_rela.c | 155 +
.../lib/loaders/elf/utils/libelf/gelf_shdr.c | 130 +
.../lib/loaders/elf/utils/libelf/gelf_sym.c | 153 +
.../loaders/elf/utils/libelf/gelf_syminfo.c | 147 +
.../loaders/elf/utils/libelf/gelf_symshndx.c | 128 +
.../lib/loaders/elf/utils/libelf/gelf_xlate.c | 81 +
.../lib/loaders/elf/utils/libelf/libelf.h | 265 ++
.../loaders/elf/utils/libelf/libelf_align.c | 185 +
.../elf/utils/libelf/libelf_allocate.c | 229 +
.../lib/loaders/elf/utils/libelf/libelf_ar.c | 461 ++
.../loaders/elf/utils/libelf/libelf_ar_util.c | 354 ++
.../elf/utils/libelf/libelf_checksum.c | 100 +
.../loaders/elf/utils/libelf/libelf_convert.c | 3112 +++++++++++++
.../loaders/elf/utils/libelf/libelf_data.c | 114 +
.../loaders/elf/utils/libelf/libelf_ehdr.c | 211 +
.../elf/utils/libelf/libelf_extended.c | 136 +
.../loaders/elf/utils/libelf/libelf_fsize.c | 149 +
.../loaders/elf/utils/libelf/libelf_msize.c | 147 +
.../loaders/elf/utils/libelf/libelf_phdr.c | 161 +
.../loaders/elf/utils/libelf/libelf_shdr.c | 56 +
.../loaders/elf/utils/libelf/libelf_xlate.c | 150 +
.../lib/loaders/elf/utils/libelf/roundup.h | 8 +
.../lib/promotions/oclutils/os/alloc.cpp | 80 +
.../lib/promotions/oclutils/os/alloc.hpp | 30 +
.../lib/promotions/oclutils/os/os.cpp | 145 +
.../lib/promotions/oclutils/os/os.hpp | 506 ++
.../lib/promotions/oclutils/os/os_posix.cpp | 828 ++++
.../lib/promotions/oclutils/os/os_win32.cpp | 1019 +++++
.../lib/promotions/oclutils/os/setjmp.S | 63 +
.../lib/promotions/oclutils/os/setjmp.asm | 110 +
.../lib/promotions/oclutils/thread/atomic.hpp | 669 +++
.../promotions/oclutils/thread/monitor.cpp | 311 ++
.../promotions/oclutils/thread/monitor.hpp | 230 +
.../promotions/oclutils/thread/semaphore.cpp | 96 +
.../promotions/oclutils/thread/semaphore.hpp | 65 +
.../lib/promotions/oclutils/thread/thread.cpp | 191 +
.../lib/promotions/oclutils/thread/thread.hpp | 228 +
.../compiler/lib/promotions/oclutils/top.hpp | 219 +
.../lib/promotions/oclutils/utils/debug.cpp | 102 +
.../lib/promotions/oclutils/utils/debug.hpp | 193 +
.../lib/promotions/oclutils/utils/macros.hpp | 171 +
.../lib/promotions/oclutils/utils/traits.hpp | 108 +
.../lib/promotions/oclutils/utils/util.hpp | 647 +++
rocclr/compiler/lib/utils/OPTIONS.def | 1091 +++++
.../compiler/lib/utils/bif_section_labels.hpp | 153 +
rocclr/compiler/lib/utils/libUtils.h | 17 +
rocclr/compiler/lib/utils/options.cpp | 1579 +++++++
rocclr/compiler/lib/utils/options.hpp | 331 ++
rocclr/compiler/lib/utils/target_mappings.h | 40 +
rocclr/compiler/lib/utils/v0_8/libUtils.cpp | 840 ++++
rocclr/compiler/lib/utils/v0_8/libUtils.h | 179 +
.../compiler/lib/utils/v0_8/target_mappings.h | 282 ++
.../lib/utils/v0_8/target_mappings_amdil.h | 103 +
.../lib/utils/v0_8/target_mappings_amdil64.h | 51 +
.../lib/utils/v0_8/target_mappings_hsail.h | 33 +
.../lib/utils/v0_8/target_mappings_hsail64.h | 32 +
.../lib/utils/v0_8/target_mappings_x64.h | 46 +
.../lib/utils/v0_8/target_mappings_x86.h | 73 +
rocclr/compiler/lib/utils/versions.hpp | 53 +
rocclr/init.txt | 1 -
rocclr/runtime/device/appprofile.cpp | 149 +
rocclr/runtime/device/appprofile.hpp | 74 +
rocclr/runtime/device/blit.cpp | 737 +++
rocclr/runtime/device/blit.hpp | 369 ++
rocclr/runtime/device/blitcl.cpp | 442 ++
rocclr/runtime/device/cpu/cpubinary.cpp | 213 +
rocclr/runtime/device/cpu/cpubinary.hpp | 85 +
rocclr/runtime/device/cpu/cpubuiltins.cpp | 57 +
rocclr/runtime/device/cpu/cpubuiltins.hpp | 20 +
rocclr/runtime/device/cpu/cpucommand.cpp | 676 +++
rocclr/runtime/device/cpu/cpucommand.hpp | 425 ++
rocclr/runtime/device/cpu/cpudevice.cpp | 1141 +++++
rocclr/runtime/device/cpu/cpudevice.hpp | 246 +
rocclr/runtime/device/cpu/cpufeat.hpp | 27 +
rocclr/runtime/device/cpu/cpukernel.S | 87 +
rocclr/runtime/device/cpu/cpukernel.asm | 84 +
rocclr/runtime/device/cpu/cpukernel.hpp | 71 +
rocclr/runtime/device/cpu/cpuprogram.cpp | 1221 +++++
rocclr/runtime/device/cpu/cpuprogram.hpp | 118 +
rocclr/runtime/device/cpu/cpusettings.cpp | 104 +
rocclr/runtime/device/cpu/cpusettings.hpp | 44 +
rocclr/runtime/device/cpu/cputables.hpp | 2015 ++++++++
rocclr/runtime/device/cpu/cpuvirtual.cpp | 627 +++
rocclr/runtime/device/cpu/cpuvirtual.hpp | 80 +
rocclr/runtime/device/cpu/ring.hpp | 207 +
rocclr/runtime/device/device.cpp | 1694 +++++++
rocclr/runtime/device/device.hpp | 1719 +++++++
rocclr/runtime/device/gpu/gpuappprofile.cpp | 98 +
rocclr/runtime/device/gpu/gpuappprofile.hpp | 44 +
rocclr/runtime/device/gpu/gpubinary.cpp | 548 +++
rocclr/runtime/device/gpu/gpubinary.hpp | 143 +
rocclr/runtime/device/gpu/gpublit.cpp | 2845 ++++++++++++
rocclr/runtime/device/gpu/gpublit.hpp | 453 ++
rocclr/runtime/device/gpu/gpucompiler.cpp | 450 ++
rocclr/runtime/device/gpu/gpuconstbuf.cpp | 89 +
rocclr/runtime/device/gpu/gpuconstbuf.hpp | 70 +
rocclr/runtime/device/gpu/gpucounters.cpp | 87 +
rocclr/runtime/device/gpu/gpucounters.hpp | 140 +
rocclr/runtime/device/gpu/gpudefs.hpp | 450 ++
rocclr/runtime/device/gpu/gpudevice.cpp | 2546 +++++++++++
rocclr/runtime/device/gpu/gpudevice.hpp | 626 +++
rocclr/runtime/device/gpu/gpuheap.cpp | 536 +++
rocclr/runtime/device/gpu/gpuheap.hpp | 225 +
rocclr/runtime/device/gpu/gpukernel.cpp | 4049 +++++++++++++++++
rocclr/runtime/device/gpu/gpukernel.hpp | 960 ++++
rocclr/runtime/device/gpu/gpumemory.cpp | 1369 ++++++
rocclr/runtime/device/gpu/gpumemory.hpp | 305 ++
rocclr/runtime/device/gpu/gpuprintf.cpp | 722 +++
rocclr/runtime/device/gpu/gpuprintf.hpp | 193 +
rocclr/runtime/device/gpu/gpuprogram.cpp | 2241 +++++++++
rocclr/runtime/device/gpu/gpuprogram.hpp | 494 ++
rocclr/runtime/device/gpu/gpuresource.cpp | 2089 +++++++++
rocclr/runtime/device/gpu/gpuresource.hpp | 508 +++
rocclr/runtime/device/gpu/gpusched.hpp | 73 +
rocclr/runtime/device/gpu/gpuschedcl.cpp | 467 ++
rocclr/runtime/device/gpu/gpuscr800.cpp | 479 ++
rocclr/runtime/device/gpu/gpuscsi.cpp | 203 +
rocclr/runtime/device/gpu/gpusettings.cpp | 483 ++
rocclr/runtime/device/gpu/gpusettings.hpp | 134 +
rocclr/runtime/device/gpu/gputhreadtrace.cpp | 66 +
rocclr/runtime/device/gpu/gputhreadtrace.hpp | 137 +
rocclr/runtime/device/gpu/gputimestamp.cpp | 119 +
rocclr/runtime/device/gpu/gputimestamp.hpp | 132 +
rocclr/runtime/device/gpu/gpuvirtual.cpp | 3253 +++++++++++++
rocclr/runtime/device/gpu/gpuvirtual.hpp | 538 +++
rocclr/runtime/device/gpu/gslbe/localdefs | 2 +
rocclr/runtime/device/gpu/gslbe/localrules | 1 +
.../device/gpu/gslbe/src/include/cal/cal.h | 304 ++
.../device/gpu/gslbe/src/include/cal/calcl.h | 660 +++
.../gslbe/src/include/extern/udx/d3d/calif.h | 284 ++
.../include/extern/udx/d3d/d3dshaderdefs.h | 99 +
.../gslbe/src/include/extern/udx/d3d/fourcc.h | 110 +
.../gpu/gslbe/src/promotions/Readme.txt | 2 +
.../src/promotions/video/win64a/mmdcore.pdb | Bin 0 -> 536576 bytes
.../promotions/video/win64a/mmdcorecal.pdb | Bin 0 -> 462848 bytes
.../promotions/video/win64a/mmdhwlbarts.pdb | Bin 0 -> 380928 bytes
.../promotions/video/win64a/mmdhwlcaicos.pdb | Bin 0 -> 389120 bytes
.../promotions/video/win64a/mmdhwlcayman.pdb | Bin 0 -> 430080 bytes
.../promotions/video/win64a/mmdhwlcedar.pdb | Bin 0 -> 233472 bytes
.../promotions/video/win64a/mmdhwlcypress.pdb | Bin 0 -> 503808 bytes
.../promotions/video/win64a/mmdhwljuniper.pdb | Bin 0 -> 159744 bytes
.../promotions/video/win64a/mmdhwlkong.pdb | Bin 0 -> 143360 bytes
.../promotions/video/win64a/mmdhwlllano.pdb | Bin 0 -> 290816 bytes
.../promotions/video/win64a/mmdhwlontario.pdb | Bin 0 -> 249856 bytes
.../promotions/video/win64a/mmdhwlr600.pdb | Bin 0 -> 593920 bytes
.../promotions/video/win64a/mmdhwlredwood.pdb | Bin 0 -> 159744 bytes
.../promotions/video/win64a/mmdhwlrs780.pdb | Bin 0 -> 233472 bytes
.../promotions/video/win64a/mmdhwlrs880.pdb | Bin 0 -> 225280 bytes
.../promotions/video/win64a/mmdhwlrv610.pdb | Bin 0 -> 135168 bytes
.../promotions/video/win64a/mmdhwlrv630.pdb | Bin 0 -> 258048 bytes
.../promotions/video/win64a/mmdhwlrv670.pdb | Bin 0 -> 135168 bytes
.../promotions/video/win64a/mmdhwlrv710.pdb | Bin 0 -> 233472 bytes
.../promotions/video/win64a/mmdhwlrv730.pdb | Bin 0 -> 323584 bytes
.../promotions/video/win64a/mmdhwlrv770.pdb | Bin 0 -> 372736 bytes
.../video/win64a/mmdhwlsi_tahiti_p.pdb | Bin 0 -> 299008 bytes
.../promotions/video/win64a/mmdhwltrinity.pdb | Bin 0 -> 241664 bytes
.../promotions/video/win64a/mmdhwlturks.pdb | Bin 0 -> 389120 bytes
.../gpu/gslbe/src/rt/DxxOpenCLInteropExt.h | 88 +
.../device/gpu/gslbe/src/rt/EventQueue.cpp | 202 +
.../device/gpu/gslbe/src/rt/EventQueue.h | 57 +
.../device/gpu/gslbe/src/rt/GSLContext.cpp | 1298 ++++++
.../device/gpu/gslbe/src/rt/GSLContext.h | 180 +
.../device/gpu/gslbe/src/rt/GSLDevice.cpp | 1719 +++++++
.../device/gpu/gslbe/src/rt/GSLDevice.h | 229 +
.../gpu/gslbe/src/rt/GSLDeviceD3D10.cpp | 231 +
.../gpu/gslbe/src/rt/GSLDeviceD3D11.cpp | 154 +
.../device/gpu/gslbe/src/rt/GSLDeviceD3D9.cpp | 56 +
.../device/gpu/gslbe/src/rt/GSLDeviceGL.cpp | 883 ++++
.../gpu/gslbe/src/rt/GSLDeviceLinux.cpp | 9 +
.../device/gpu/gslbe/src/rt/GSLDeviceWin.cpp | 9 +
.../device/gpu/gslbe/src/rt/GSLStubs.cpp | 134 +
.../device/gpu/gslbe/src/rt/backend.cpp | 206 +
.../runtime/device/gpu/gslbe/src/rt/backend.h | 54 +
.../gpu/gslbe/src/rt/inifile/ini_export.cpp | 95 +
.../gpu/gslbe/src/rt/inifile/ini_export.h | 13 +
.../gpu/gslbe/src/rt/inifile/ini_values.h | 334 ++
.../gpu/gslbe/src/rt/inifile/inifile.cpp | 537 +++
.../device/gpu/gslbe/src/rt/inifile/inifile.h | 164 +
.../gslbe/src/rt/inifile/inifile_parser.cpp | 225 +
.../gpu/gslbe/src/rt/inifile/inifile_parser.h | 42 +
rocclr/runtime/device/hsa/hsaappprofile.cpp | 61 +
rocclr/runtime/device/hsa/hsaappprofile.hpp | 27 +
rocclr/runtime/device/hsa/hsabinary.cpp | 152 +
rocclr/runtime/device/hsa/hsabinary.hpp | 56 +
rocclr/runtime/device/hsa/hsablit.cpp | 1827 ++++++++
rocclr/runtime/device/hsa/hsablit.hpp | 401 ++
rocclr/runtime/device/hsa/hsacompiler.cpp | 163 +
rocclr/runtime/device/hsa/hsacompilerlib.cpp | 67 +
rocclr/runtime/device/hsa/hsacompilerlib.hpp | 92 +
.../device/hsa/hsacore_symbol_loader.cpp | 53 +
.../device/hsa/hsacore_symbol_loader.hpp | 75 +
rocclr/runtime/device/hsa/hsacounters.cpp | 144 +
rocclr/runtime/device/hsa/hsacounters.hpp | 103 +
rocclr/runtime/device/hsa/hsadefs.hpp | 42 +
rocclr/runtime/device/hsa/hsadevice.cpp | 914 ++++
rocclr/runtime/device/hsa/hsadevice.hpp | 369 ++
rocclr/runtime/device/hsa/hsakernel.cpp | 571 +++
rocclr/runtime/device/hsa/hsakernel.hpp | 161 +
rocclr/runtime/device/hsa/hsamemory.cpp | 936 ++++
rocclr/runtime/device/hsa/hsamemory.hpp | 200 +
rocclr/runtime/device/hsa/hsaprogram.cpp | 768 ++++
rocclr/runtime/device/hsa/hsaprogram.hpp | 160 +
rocclr/runtime/device/hsa/hsasettings.cpp | 81 +
rocclr/runtime/device/hsa/hsasettings.hpp | 65 +
rocclr/runtime/device/hsa/hsavirtual.cpp | 1545 +++++++
rocclr/runtime/device/hsa/hsavirtual.hpp | 185 +
rocclr/runtime/device/hsa/oclhsa.def | 3 +
rocclr/runtime/device/hsa/oclhsa_common.hpp | 26 +
.../device/hsa/services_symbol_loader.cpp | 52 +
.../device/hsa/services_symbol_loader.hpp | 78 +
rocclr/runtime/device/hsa/system_memory.h | 97 +
rocclr/runtime/os/alloc.cpp | 87 +
rocclr/runtime/os/alloc.hpp | 30 +
rocclr/runtime/os/os.cpp | 145 +
rocclr/runtime/os/os.hpp | 519 +++
rocclr/runtime/os/os_posix.cpp | 882 ++++
rocclr/runtime/os/os_win32.cpp | 1093 +++++
rocclr/runtime/os/setjmp.S | 63 +
rocclr/runtime/os/setjmp.asm | 110 +
rocclr/runtime/platform/agent.cpp | 530 +++
rocclr/runtime/platform/agent.hpp | 150 +
rocclr/runtime/platform/command.cpp | 578 +++
rocclr/runtime/platform/command.hpp | 1561 +++++++
rocclr/runtime/platform/commandqueue.cpp | 197 +
rocclr/runtime/platform/commandqueue.hpp | 254 ++
rocclr/runtime/platform/context.cpp | 363 ++
rocclr/runtime/platform/context.hpp | 198 +
rocclr/runtime/platform/counter.hpp | 33 +
rocclr/runtime/platform/interop.hpp | 50 +
rocclr/runtime/platform/kernel.cpp | 254 ++
rocclr/runtime/platform/kernel.hpp | 221 +
rocclr/runtime/platform/memory.cpp | 1520 +++++++
rocclr/runtime/platform/memory.hpp | 662 +++
rocclr/runtime/platform/ndrange.cpp | 70 +
rocclr/runtime/platform/ndrange.hpp | 213 +
rocclr/runtime/platform/object.cpp | 88 +
rocclr/runtime/platform/object.hpp | 270 ++
rocclr/runtime/platform/perfctr.hpp | 65 +
rocclr/runtime/platform/program.cpp | 656 +++
rocclr/runtime/platform/program.hpp | 200 +
rocclr/runtime/platform/runtime.cpp | 183 +
rocclr/runtime/platform/runtime.hpp | 76 +
rocclr/runtime/platform/sampler.hpp | 175 +
rocclr/runtime/platform/threadtrace.hpp | 129 +
rocclr/runtime/platform/video_session.hpp | 79 +
rocclr/runtime/thread/atomic.hpp | 677 +++
rocclr/runtime/thread/monitor.cpp | 313 ++
rocclr/runtime/thread/monitor.hpp | 233 +
rocclr/runtime/thread/semaphore.cpp | 96 +
rocclr/runtime/thread/semaphore.hpp | 65 +
rocclr/runtime/thread/thread.cpp | 191 +
rocclr/runtime/thread/thread.hpp | 228 +
rocclr/runtime/top.hpp | 171 +
rocclr/runtime/utils/concurrent.hpp | 206 +
rocclr/runtime/utils/debug.cpp | 102 +
rocclr/runtime/utils/debug.hpp | 182 +
rocclr/runtime/utils/flags.cpp | 197 +
rocclr/runtime/utils/flags.hpp | 248 +
rocclr/runtime/utils/macros.hpp | 171 +
rocclr/runtime/utils/util.hpp | 370 ++
rocclr/runtime/utils/versions.hpp | 34 +
351 files changed, 113713 insertions(+), 1 deletion(-)
create mode 100644 rocclr/compiler/lib/Doxyfile
create mode 100644 rocclr/compiler/lib/amdoclcl.def.in
create mode 100644 rocclr/compiler/lib/amdoclcl.map.in
create mode 100644 rocclr/compiler/lib/amdoclcl.rc
create mode 100644 rocclr/compiler/lib/backends/common/backend.hpp
create mode 100644 rocclr/compiler/lib/backends/common/codegen.cpp
create mode 100644 rocclr/compiler/lib/backends/common/codegen.hpp
create mode 100644 rocclr/compiler/lib/backends/common/compiler_stage.cpp
create mode 100644 rocclr/compiler/lib/backends/common/compiler_stage.hpp
create mode 100644 rocclr/compiler/lib/backends/common/frontend.cpp
create mode 100644 rocclr/compiler/lib/backends/common/frontend.hpp
create mode 100644 rocclr/compiler/lib/backends/common/frontend_clang.cpp
create mode 100644 rocclr/compiler/lib/backends/common/if_acl.h
create mode 100644 rocclr/compiler/lib/backends/common/library.cpp
create mode 100644 rocclr/compiler/lib/backends/common/library.hpp
create mode 100644 rocclr/compiler/lib/backends/common/linker.cpp
create mode 100644 rocclr/compiler/lib/backends/common/linker.hpp
create mode 100644 rocclr/compiler/lib/backends/common/opt_level.cpp
create mode 100644 rocclr/compiler/lib/backends/common/opt_level.hpp
create mode 100644 rocclr/compiler/lib/backends/common/optimizer.cpp
create mode 100644 rocclr/compiler/lib/backends/common/optimizer.hpp
create mode 100644 rocclr/compiler/lib/backends/common/spir.cpp
create mode 100644 rocclr/compiler/lib/backends/common/spir.hpp
create mode 100644 rocclr/compiler/lib/backends/common/v0_8/if_acl.cpp
create mode 100644 rocclr/compiler/lib/backends/common/v0_8/if_acl.h
create mode 100644 rocclr/compiler/lib/complibdefs
create mode 100644 rocclr/compiler/lib/complibrules
create mode 100644 rocclr/compiler/lib/include/acl.h
create mode 100644 rocclr/compiler/lib/include/aclDefs.h
create mode 100644 rocclr/compiler/lib/include/aclEnums.h
create mode 100644 rocclr/compiler/lib/include/aclFunctors.h
create mode 100644 rocclr/compiler/lib/include/aclStructs.h
create mode 100644 rocclr/compiler/lib/include/aclTypes.h
create mode 100644 rocclr/compiler/lib/include/v0_8/acl.h
create mode 100644 rocclr/compiler/lib/include/v0_8/aclDefs.h
create mode 100644 rocclr/compiler/lib/include/v0_8/aclEnums.h
create mode 100644 rocclr/compiler/lib/include/v0_8/aclFunctors.h
create mode 100644 rocclr/compiler/lib/include/v0_8/aclStructs.h
create mode 100644 rocclr/compiler/lib/include/v0_8/aclTypes.h
create mode 100644 rocclr/compiler/lib/loaders/elf/elf.cpp
create mode 100644 rocclr/compiler/lib/loaders/elf/elf.hpp
create mode 100644 rocclr/compiler/lib/loaders/elf/elf_utils.cpp
create mode 100644 rocclr/compiler/lib/loaders/elf/elf_utils.hpp
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/common/_elftc.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/common/elfdefinitions.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/common/native-elf-format
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/common/native-elf-format.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/common/uthash.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/README
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/README.build
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/Version.map
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/_libelf.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/_libelf_ar.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/_libelf_config.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_begin.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_cntl.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_data.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_end.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_errmsg.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_errno.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_fill.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_flag.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_getarhdr.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_getarsym.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_getbase.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_getident.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_hash.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_kind.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_memory.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_next.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_phnum.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_rand.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_rawfile.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_scn.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_shnum.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_shstrndx.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_strptr.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_update.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/elf_version.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_cap.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_checksum.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_dyn.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_ehdr.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_fsize.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_getclass.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_move.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_phdr.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_rel.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_rela.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_shdr.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_sym.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_syminfo.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_symshndx.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/gelf_xlate.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf.h
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_align.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_allocate.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_ar.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_ar_util.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_checksum.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_convert.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_data.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_ehdr.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_extended.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_fsize.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_msize.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_phdr.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_shdr.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/libelf_xlate.c
create mode 100644 rocclr/compiler/lib/loaders/elf/utils/libelf/roundup.h
create mode 100644 rocclr/compiler/lib/promotions/oclutils/os/alloc.cpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/os/alloc.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/os/os.cpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/os/os.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/os/os_posix.cpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/os/os_win32.cpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/os/setjmp.S
create mode 100644 rocclr/compiler/lib/promotions/oclutils/os/setjmp.asm
create mode 100644 rocclr/compiler/lib/promotions/oclutils/thread/atomic.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/thread/monitor.cpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/thread/monitor.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/thread/semaphore.cpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/thread/semaphore.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/thread/thread.cpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/thread/thread.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/top.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/utils/debug.cpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/utils/debug.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/utils/macros.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/utils/traits.hpp
create mode 100644 rocclr/compiler/lib/promotions/oclutils/utils/util.hpp
create mode 100644 rocclr/compiler/lib/utils/OPTIONS.def
create mode 100644 rocclr/compiler/lib/utils/bif_section_labels.hpp
create mode 100644 rocclr/compiler/lib/utils/libUtils.h
create mode 100644 rocclr/compiler/lib/utils/options.cpp
create mode 100644 rocclr/compiler/lib/utils/options.hpp
create mode 100644 rocclr/compiler/lib/utils/target_mappings.h
create mode 100644 rocclr/compiler/lib/utils/v0_8/libUtils.cpp
create mode 100644 rocclr/compiler/lib/utils/v0_8/libUtils.h
create mode 100644 rocclr/compiler/lib/utils/v0_8/target_mappings.h
create mode 100644 rocclr/compiler/lib/utils/v0_8/target_mappings_amdil.h
create mode 100644 rocclr/compiler/lib/utils/v0_8/target_mappings_amdil64.h
create mode 100644 rocclr/compiler/lib/utils/v0_8/target_mappings_hsail.h
create mode 100644 rocclr/compiler/lib/utils/v0_8/target_mappings_hsail64.h
create mode 100644 rocclr/compiler/lib/utils/v0_8/target_mappings_x64.h
create mode 100644 rocclr/compiler/lib/utils/v0_8/target_mappings_x86.h
create mode 100644 rocclr/compiler/lib/utils/versions.hpp
delete mode 100644 rocclr/init.txt
create mode 100644 rocclr/runtime/device/appprofile.cpp
create mode 100644 rocclr/runtime/device/appprofile.hpp
create mode 100644 rocclr/runtime/device/blit.cpp
create mode 100644 rocclr/runtime/device/blit.hpp
create mode 100644 rocclr/runtime/device/blitcl.cpp
create mode 100644 rocclr/runtime/device/cpu/cpubinary.cpp
create mode 100644 rocclr/runtime/device/cpu/cpubinary.hpp
create mode 100644 rocclr/runtime/device/cpu/cpubuiltins.cpp
create mode 100644 rocclr/runtime/device/cpu/cpubuiltins.hpp
create mode 100644 rocclr/runtime/device/cpu/cpucommand.cpp
create mode 100644 rocclr/runtime/device/cpu/cpucommand.hpp
create mode 100644 rocclr/runtime/device/cpu/cpudevice.cpp
create mode 100644 rocclr/runtime/device/cpu/cpudevice.hpp
create mode 100644 rocclr/runtime/device/cpu/cpufeat.hpp
create mode 100644 rocclr/runtime/device/cpu/cpukernel.S
create mode 100644 rocclr/runtime/device/cpu/cpukernel.asm
create mode 100644 rocclr/runtime/device/cpu/cpukernel.hpp
create mode 100644 rocclr/runtime/device/cpu/cpuprogram.cpp
create mode 100644 rocclr/runtime/device/cpu/cpuprogram.hpp
create mode 100644 rocclr/runtime/device/cpu/cpusettings.cpp
create mode 100644 rocclr/runtime/device/cpu/cpusettings.hpp
create mode 100644 rocclr/runtime/device/cpu/cputables.hpp
create mode 100644 rocclr/runtime/device/cpu/cpuvirtual.cpp
create mode 100644 rocclr/runtime/device/cpu/cpuvirtual.hpp
create mode 100644 rocclr/runtime/device/cpu/ring.hpp
create mode 100644 rocclr/runtime/device/device.cpp
create mode 100644 rocclr/runtime/device/device.hpp
create mode 100644 rocclr/runtime/device/gpu/gpuappprofile.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuappprofile.hpp
create mode 100644 rocclr/runtime/device/gpu/gpubinary.cpp
create mode 100644 rocclr/runtime/device/gpu/gpubinary.hpp
create mode 100644 rocclr/runtime/device/gpu/gpublit.cpp
create mode 100644 rocclr/runtime/device/gpu/gpublit.hpp
create mode 100644 rocclr/runtime/device/gpu/gpucompiler.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuconstbuf.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuconstbuf.hpp
create mode 100644 rocclr/runtime/device/gpu/gpucounters.cpp
create mode 100644 rocclr/runtime/device/gpu/gpucounters.hpp
create mode 100644 rocclr/runtime/device/gpu/gpudefs.hpp
create mode 100644 rocclr/runtime/device/gpu/gpudevice.cpp
create mode 100644 rocclr/runtime/device/gpu/gpudevice.hpp
create mode 100644 rocclr/runtime/device/gpu/gpuheap.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuheap.hpp
create mode 100644 rocclr/runtime/device/gpu/gpukernel.cpp
create mode 100644 rocclr/runtime/device/gpu/gpukernel.hpp
create mode 100644 rocclr/runtime/device/gpu/gpumemory.cpp
create mode 100644 rocclr/runtime/device/gpu/gpumemory.hpp
create mode 100644 rocclr/runtime/device/gpu/gpuprintf.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuprintf.hpp
create mode 100644 rocclr/runtime/device/gpu/gpuprogram.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuprogram.hpp
create mode 100644 rocclr/runtime/device/gpu/gpuresource.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuresource.hpp
create mode 100644 rocclr/runtime/device/gpu/gpusched.hpp
create mode 100644 rocclr/runtime/device/gpu/gpuschedcl.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuscr800.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuscsi.cpp
create mode 100644 rocclr/runtime/device/gpu/gpusettings.cpp
create mode 100644 rocclr/runtime/device/gpu/gpusettings.hpp
create mode 100644 rocclr/runtime/device/gpu/gputhreadtrace.cpp
create mode 100644 rocclr/runtime/device/gpu/gputhreadtrace.hpp
create mode 100644 rocclr/runtime/device/gpu/gputimestamp.cpp
create mode 100644 rocclr/runtime/device/gpu/gputimestamp.hpp
create mode 100644 rocclr/runtime/device/gpu/gpuvirtual.cpp
create mode 100644 rocclr/runtime/device/gpu/gpuvirtual.hpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/localdefs
create mode 100644 rocclr/runtime/device/gpu/gslbe/localrules
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/include/cal/cal.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/include/cal/calcl.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/include/extern/udx/d3d/calif.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/include/extern/udx/d3d/d3dshaderdefs.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/include/extern/udx/d3d/fourcc.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/Readme.txt
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdcore.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdcorecal.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlbarts.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlcaicos.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlcayman.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlcedar.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlcypress.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwljuniper.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlkong.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlllano.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlontario.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlr600.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlredwood.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlrs780.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlrs880.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlrv610.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlrv630.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlrv670.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlrv710.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlrv730.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlrv770.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlsi_tahiti_p.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwltrinity.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/promotions/video/win64a/mmdhwlturks.pdb
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/DxxOpenCLInteropExt.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/EventQueue.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/EventQueue.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLContext.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLContext.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLDevice.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLDevice.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLDeviceD3D10.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLDeviceD3D11.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLDeviceD3D9.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLDeviceGL.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLDeviceLinux.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLDeviceWin.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/GSLStubs.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/backend.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/backend.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/inifile/ini_export.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/inifile/ini_export.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/inifile/ini_values.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/inifile/inifile.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/inifile/inifile.h
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/inifile/inifile_parser.cpp
create mode 100644 rocclr/runtime/device/gpu/gslbe/src/rt/inifile/inifile_parser.h
create mode 100644 rocclr/runtime/device/hsa/hsaappprofile.cpp
create mode 100644 rocclr/runtime/device/hsa/hsaappprofile.hpp
create mode 100644 rocclr/runtime/device/hsa/hsabinary.cpp
create mode 100644 rocclr/runtime/device/hsa/hsabinary.hpp
create mode 100644 rocclr/runtime/device/hsa/hsablit.cpp
create mode 100644 rocclr/runtime/device/hsa/hsablit.hpp
create mode 100644 rocclr/runtime/device/hsa/hsacompiler.cpp
create mode 100644 rocclr/runtime/device/hsa/hsacompilerlib.cpp
create mode 100644 rocclr/runtime/device/hsa/hsacompilerlib.hpp
create mode 100644 rocclr/runtime/device/hsa/hsacore_symbol_loader.cpp
create mode 100644 rocclr/runtime/device/hsa/hsacore_symbol_loader.hpp
create mode 100644 rocclr/runtime/device/hsa/hsacounters.cpp
create mode 100644 rocclr/runtime/device/hsa/hsacounters.hpp
create mode 100644 rocclr/runtime/device/hsa/hsadefs.hpp
create mode 100644 rocclr/runtime/device/hsa/hsadevice.cpp
create mode 100644 rocclr/runtime/device/hsa/hsadevice.hpp
create mode 100644 rocclr/runtime/device/hsa/hsakernel.cpp
create mode 100644 rocclr/runtime/device/hsa/hsakernel.hpp
create mode 100644 rocclr/runtime/device/hsa/hsamemory.cpp
create mode 100644 rocclr/runtime/device/hsa/hsamemory.hpp
create mode 100644 rocclr/runtime/device/hsa/hsaprogram.cpp
create mode 100644 rocclr/runtime/device/hsa/hsaprogram.hpp
create mode 100644 rocclr/runtime/device/hsa/hsasettings.cpp
create mode 100644 rocclr/runtime/device/hsa/hsasettings.hpp
create mode 100644 rocclr/runtime/device/hsa/hsavirtual.cpp
create mode 100644 rocclr/runtime/device/hsa/hsavirtual.hpp
create mode 100644 rocclr/runtime/device/hsa/oclhsa.def
create mode 100644 rocclr/runtime/device/hsa/oclhsa_common.hpp
create mode 100644 rocclr/runtime/device/hsa/services_symbol_loader.cpp
create mode 100644 rocclr/runtime/device/hsa/services_symbol_loader.hpp
create mode 100644 rocclr/runtime/device/hsa/system_memory.h
create mode 100644 rocclr/runtime/os/alloc.cpp
create mode 100644 rocclr/runtime/os/alloc.hpp
create mode 100644 rocclr/runtime/os/os.cpp
create mode 100644 rocclr/runtime/os/os.hpp
create mode 100644 rocclr/runtime/os/os_posix.cpp
create mode 100644 rocclr/runtime/os/os_win32.cpp
create mode 100644 rocclr/runtime/os/setjmp.S
create mode 100644 rocclr/runtime/os/setjmp.asm
create mode 100644 rocclr/runtime/platform/agent.cpp
create mode 100644 rocclr/runtime/platform/agent.hpp
create mode 100644 rocclr/runtime/platform/command.cpp
create mode 100644 rocclr/runtime/platform/command.hpp
create mode 100644 rocclr/runtime/platform/commandqueue.cpp
create mode 100644 rocclr/runtime/platform/commandqueue.hpp
create mode 100644 rocclr/runtime/platform/context.cpp
create mode 100644 rocclr/runtime/platform/context.hpp
create mode 100644 rocclr/runtime/platform/counter.hpp
create mode 100644 rocclr/runtime/platform/interop.hpp
create mode 100644 rocclr/runtime/platform/kernel.cpp
create mode 100644 rocclr/runtime/platform/kernel.hpp
create mode 100644 rocclr/runtime/platform/memory.cpp
create mode 100644 rocclr/runtime/platform/memory.hpp
create mode 100644 rocclr/runtime/platform/ndrange.cpp
create mode 100644 rocclr/runtime/platform/ndrange.hpp
create mode 100644 rocclr/runtime/platform/object.cpp
create mode 100644 rocclr/runtime/platform/object.hpp
create mode 100644 rocclr/runtime/platform/perfctr.hpp
create mode 100644 rocclr/runtime/platform/program.cpp
create mode 100644 rocclr/runtime/platform/program.hpp
create mode 100644 rocclr/runtime/platform/runtime.cpp
create mode 100644 rocclr/runtime/platform/runtime.hpp
create mode 100644 rocclr/runtime/platform/sampler.hpp
create mode 100644 rocclr/runtime/platform/threadtrace.hpp
create mode 100644 rocclr/runtime/platform/video_session.hpp
create mode 100644 rocclr/runtime/thread/atomic.hpp
create mode 100644 rocclr/runtime/thread/monitor.cpp
create mode 100644 rocclr/runtime/thread/monitor.hpp
create mode 100644 rocclr/runtime/thread/semaphore.cpp
create mode 100644 rocclr/runtime/thread/semaphore.hpp
create mode 100644 rocclr/runtime/thread/thread.cpp
create mode 100644 rocclr/runtime/thread/thread.hpp
create mode 100644 rocclr/runtime/top.hpp
create mode 100644 rocclr/runtime/utils/concurrent.hpp
create mode 100644 rocclr/runtime/utils/debug.cpp
create mode 100644 rocclr/runtime/utils/debug.hpp
create mode 100644 rocclr/runtime/utils/flags.cpp
create mode 100644 rocclr/runtime/utils/flags.hpp
create mode 100644 rocclr/runtime/utils/macros.hpp
create mode 100644 rocclr/runtime/utils/util.hpp
create mode 100644 rocclr/runtime/utils/versions.hpp
diff --git a/rocclr/compiler/lib/Doxyfile b/rocclr/compiler/lib/Doxyfile
new file mode 100644
index 0000000000..1c59052d73
--- /dev/null
+++ b/rocclr/compiler/lib/Doxyfile
@@ -0,0 +1,1606 @@
+# Doxyfile 1.6.3
+
+# This file describes the settings to be used by the documentation system
+# doxygen (www.doxygen.org) for a project
+#
+# All text after a hash (#) is considered a comment and will be ignored
+# The format is:
+# TAG = value [value, ...]
+# For lists items can also be appended using:
+# TAG += value [value, ...]
+# Values that contain spaces should be placed between quotes (" ")
+
+#---------------------------------------------------------------------------
+# Project related configuration options
+#---------------------------------------------------------------------------
+
+# This tag specifies the encoding used for all characters in the config file
+# that follow. The default is UTF-8 which is also the encoding used for all
+# text before the first occurrence of this tag. Doxygen uses libiconv (or the
+# iconv built into libc) for the transcoding. See
+# http://www.gnu.org/software/libiconv for the list of possible encodings.
+
+DOXYFILE_ENCODING = UTF-8
+
+# The PROJECT_NAME tag is a single word (or a sequence of words surrounded
+# by quotes) that should identify the project.
+
+PROJECT_NAME = CompilerLibrary
+
+# The PROJECT_NUMBER tag can be used to enter a project or revision number.
+# This could be handy for archiving the generated documentation or
+# if some version control system is used.
+
+PROJECT_NUMBER = 0.9
+
+# The OUTPUT_DIRECTORY tag is used to specify the (relative or absolute)
+# base path where the generated documentation will be put.
+# If a relative path is entered, it will be relative to the location
+# where doxygen was started. If left blank the current directory will be used.
+
+OUTPUT_DIRECTORY = D:/hq/stg/opencl/drivers/opencl/compiler/lib/docs
+
+# If the CREATE_SUBDIRS tag is set to YES, then doxygen will create
+# 4096 sub-directories (in 2 levels) under the output directory of each output
+# format and will distribute the generated files over these directories.
+# Enabling this option can be useful when feeding doxygen a huge amount of
+# source files, where putting all generated files in the same directory would
+# otherwise cause performance problems for the file system.
+
+CREATE_SUBDIRS = NO
+
+# The OUTPUT_LANGUAGE tag is used to specify the language in which all
+# documentation generated by doxygen is written. Doxygen will use this
+# information to generate all constant output in the proper language.
+# The default language is English, other supported languages are:
+# Afrikaans, Arabic, Brazilian, Catalan, Chinese, Chinese-Traditional,
+# Croatian, Czech, Danish, Dutch, Esperanto, Farsi, Finnish, French, German,
+# Greek, Hungarian, Italian, Japanese, Japanese-en (Japanese with English
+# messages), Korean, Korean-en, Lithuanian, Norwegian, Macedonian, Persian,
+# Polish, Portuguese, Romanian, Russian, Serbian, Serbian-Cyrilic, Slovak,
+# Slovene, Spanish, Swedish, Ukrainian, and Vietnamese.
+
+OUTPUT_LANGUAGE = English
+
+# If the BRIEF_MEMBER_DESC tag is set to YES (the default) Doxygen will
+# include brief member descriptions after the members that are listed in
+# the file and class documentation (similar to JavaDoc).
+# Set to NO to disable this.
+
+BRIEF_MEMBER_DESC = YES
+
+# If the REPEAT_BRIEF tag is set to YES (the default) Doxygen will prepend
+# the brief description of a member or function before the detailed description.
+# Note: if both HIDE_UNDOC_MEMBERS and BRIEF_MEMBER_DESC are set to NO, the
+# brief descriptions will be completely suppressed.
+
+REPEAT_BRIEF = YES
+
+# This tag implements a quasi-intelligent brief description abbreviator
+# that is used to form the text in various listings. Each string
+# in this list, if found as the leading text of the brief description, will be
+# stripped from the text and the result after processing the whole list, is
+# used as the annotated text. Otherwise, the brief description is used as-is.
+# If left blank, the following values are used ("$name" is automatically
+# replaced with the name of the entity): "The $name class" "The $name widget"
+# "The $name file" "is" "provides" "specifies" "contains"
+# "represents" "a" "an" "the"
+
+ABBREVIATE_BRIEF = "The $name class" \
+ "The $name widget" \
+ "The $name file" \
+ is \
+ provides \
+ specifies \
+ contains \
+ represents \
+ a \
+ an \
+ the
+
+# If the ALWAYS_DETAILED_SEC and REPEAT_BRIEF tags are both set to YES then
+# Doxygen will generate a detailed section even if there is only a brief
+# description.
+
+ALWAYS_DETAILED_SEC = NO
+
+# If the INLINE_INHERITED_MEMB tag is set to YES, doxygen will show all
+# inherited members of a class in the documentation of that class as if those
+# members were ordinary class members. Constructors, destructors and assignment
+# operators of the base classes will not be shown.
+
+INLINE_INHERITED_MEMB = NO
+
+# If the FULL_PATH_NAMES tag is set to YES then Doxygen will prepend the full
+# path before files name in the file list and in the header files. If set
+# to NO the shortest path that makes the file name unique will be used.
+
+FULL_PATH_NAMES = NO
+
+# If the FULL_PATH_NAMES tag is set to YES then the STRIP_FROM_PATH tag
+# can be used to strip a user-defined part of the path. Stripping is
+# only done if one of the specified strings matches the left-hand part of
+# the path. The tag can be used to show relative paths in the file list.
+# If left blank the directory from which doxygen is run is used as the
+# path to strip.
+
+STRIP_FROM_PATH =
+
+# The STRIP_FROM_INC_PATH tag can be used to strip a user-defined part of
+# the path mentioned in the documentation of a class, which tells
+# the reader which header file to include in order to use a class.
+# If left blank only the name of the header file containing the class
+# definition is used. Otherwise one should specify the include paths that
+# are normally passed to the compiler using the -I flag.
+
+STRIP_FROM_INC_PATH =
+
+# If the SHORT_NAMES tag is set to YES, doxygen will generate much shorter
+# (but less readable) file names. This can be useful if your file system
+# doesn't support long names like on DOS, Mac, or CD-ROM.
+
+SHORT_NAMES = NO
+
+# If the JAVADOC_AUTOBRIEF tag is set to YES then Doxygen
+# will interpret the first line (until the first dot) of a JavaDoc-style
+# comment as the brief description. If set to NO, the JavaDoc
+# comments will behave just like regular Qt-style comments
+# (thus requiring an explicit @brief command for a brief description.)
+
+JAVADOC_AUTOBRIEF = NO
+
+# If the QT_AUTOBRIEF tag is set to YES then Doxygen will
+# interpret the first line (until the first dot) of a Qt-style
+# comment as the brief description. If set to NO, the comments
+# will behave just like regular Qt-style comments (thus requiring
+# an explicit \brief command for a brief description.)
+
+QT_AUTOBRIEF = NO
+
+# The MULTILINE_CPP_IS_BRIEF tag can be set to YES to make Doxygen
+# treat a multi-line C++ special comment block (i.e. a block of //! or ///
+# comments) as a brief description. This used to be the default behaviour.
+# The new default is to treat a multi-line C++ comment block as a detailed
+# description. Set this tag to YES if you prefer the old behaviour instead.
+
+MULTILINE_CPP_IS_BRIEF = NO
+
+# If the INHERIT_DOCS tag is set to YES (the default) then an undocumented
+# member inherits the documentation from any documented member that it
+# re-implements.
+
+INHERIT_DOCS = YES
+
+# If the SEPARATE_MEMBER_PAGES tag is set to YES, then doxygen will produce
+# a new page for each member. If set to NO, the documentation of a member will
+# be part of the file/class/namespace that contains it.
+
+SEPARATE_MEMBER_PAGES = NO
+
+# The TAB_SIZE tag can be used to set the number of spaces in a tab.
+# Doxygen uses this value to replace tabs by spaces in code fragments.
+
+TAB_SIZE = 8
+
+# This tag can be used to specify a number of aliases that acts
+# as commands in the documentation. An alias has the form "name=value".
+# For example adding "sideeffect=\par Side Effects:\n" will allow you to
+# put the command \sideeffect (or @sideeffect) in the documentation, which
+# will result in a user-defined paragraph with heading "Side Effects:".
+# You can put \n's in the value part of an alias to insert newlines.
+
+ALIASES =
+
+# Set the OPTIMIZE_OUTPUT_FOR_C tag to YES if your project consists of C
+# sources only. Doxygen will then generate output that is more tailored for C.
+# For instance, some of the names that are used will be different. The list
+# of all members will be omitted, etc.
+
+OPTIMIZE_OUTPUT_FOR_C = YES
+
+# Set the OPTIMIZE_OUTPUT_JAVA tag to YES if your project consists of Java
+# sources only. Doxygen will then generate output that is more tailored for
+# Java. For instance, namespaces will be presented as packages, qualified
+# scopes will look different, etc.
+
+OPTIMIZE_OUTPUT_JAVA = NO
+
+# Set the OPTIMIZE_FOR_FORTRAN tag to YES if your project consists of Fortran
+# sources only. Doxygen will then generate output that is more tailored for
+# Fortran.
+
+OPTIMIZE_FOR_FORTRAN = NO
+
+# Set the OPTIMIZE_OUTPUT_VHDL tag to YES if your project consists of VHDL
+# sources. Doxygen will then generate output that is tailored for
+# VHDL.
+
+OPTIMIZE_OUTPUT_VHDL = NO
+
+# Doxygen selects the parser to use depending on the extension of the files it parses.
+# With this tag you can assign which parser to use for a given extension.
+# Doxygen has a built-in mapping, but you can override or extend it using this tag.
+# The format is ext=language, where ext is a file extension, and language is one of
+# the parsers supported by doxygen: IDL, Java, Javascript, C#, C, C++, D, PHP,
+# Objective-C, Python, Fortran, VHDL. For instance to make doxygen treat
+# .inc files as Fortran files (default is PHP), and .f files as C (default is Fortran),
+# use: inc=Fortran f=C. Note that for custom extensions you also need to set
+# FILE_PATTERNS otherwise the files are not read by doxygen.
+
+EXTENSION_MAPPING =
+
+# If you use STL classes (i.e. std::string, std::vector, etc.) but do not want
+# to include (a tag file for) the STL sources as input, then you should
+# set this tag to YES in order to let doxygen match functions declarations and
+# definitions whose arguments contain STL classes (e.g. func(std::string); vs.
+# func(std::string) {}). This also makes the inheritance and collaboration
+# diagrams that involve STL classes more complete and accurate.
+
+BUILTIN_STL_SUPPORT = YES
+
+# If you use Microsoft's C++/CLI language, you should set this option to YES to
+# enable parsing support.
+
+CPP_CLI_SUPPORT = NO
+
+# Set the SIP_SUPPORT tag to YES if your project consists of sip sources only.
+# Doxygen will parse them like normal C++ but will assume all classes use public
+# instead of private inheritance when no explicit protection keyword is present.
+
+SIP_SUPPORT = NO
+
+# For Microsoft's IDL there are propget and propput attributes to indicate getter
+# and setter methods for a property. Setting this option to YES (the default)
+# will make doxygen replace the get and set methods by a property in the
+# documentation. This will only work if the methods are indeed getting or
+# setting a simple type. If this is not the case, or you want to show the
+# methods anyway, you should set this option to NO.
+
+IDL_PROPERTY_SUPPORT = YES
+
+# If member grouping is used in the documentation and the DISTRIBUTE_GROUP_DOC
+# tag is set to YES, then doxygen will reuse the documentation of the first
+# member in the group (if any) for the other members of the group. By default
+# all members of a group must be documented explicitly.
+
+DISTRIBUTE_GROUP_DOC = YES
+
+# Set the SUBGROUPING tag to YES (the default) to allow class member groups of
+# the same type (for instance a group of public functions) to be put as a
+# subgroup of that type (e.g. under the Public Functions section). Set it to
+# NO to prevent subgrouping. Alternatively, this can be done per class using
+# the \nosubgrouping command.
+
+SUBGROUPING = YES
+
+# When TYPEDEF_HIDES_STRUCT is enabled, a typedef of a struct, union, or enum
+# is documented as struct, union, or enum with the name of the typedef. So
+# typedef struct TypeS {} TypeT, will appear in the documentation as a struct
+# with name TypeT. When disabled the typedef will appear as a member of a file,
+# namespace, or class. And the struct will be named TypeS. This can typically
+# be useful for C code in case the coding convention dictates that all compound
+# types are typedef'ed and only the typedef is referenced, never the tag name.
+
+TYPEDEF_HIDES_STRUCT = YES
+
+# The SYMBOL_CACHE_SIZE determines the size of the internal cache used to
+# determine which symbols to keep in memory and which to flush to disk.
+# When the cache is full, less often used symbols will be written to disk.
+# For small to medium size projects (<1000 input files) the default value is
+# probably good enough. For larger projects a too small cache size can cause
+# doxygen to be busy swapping symbols to and from disk most of the time
+# causing a significant performance penalty.
+# If the system has enough physical memory increasing the cache will improve the
+# performance by keeping more symbols in memory. Note that the value works on
+# a logarithmic scale so increasing the size by one will roughly double the
+# memory usage. The cache size is given by this formula:
+# 2^(16+SYMBOL_CACHE_SIZE). The valid range is 0..9, the default is 0,
+# corresponding to a cache size of 2^16 = 65536 symbols
+
+SYMBOL_CACHE_SIZE = 0
+
+#---------------------------------------------------------------------------
+# Build related configuration options
+#---------------------------------------------------------------------------
+
+# If the EXTRACT_ALL tag is set to YES doxygen will assume all entities in
+# documentation are documented, even if no documentation was available.
+# Private class members and static file members will be hidden unless
+# the EXTRACT_PRIVATE and EXTRACT_STATIC tags are set to YES
+
+EXTRACT_ALL = YES
+
+# If the EXTRACT_PRIVATE tag is set to YES all private members of a class
+# will be included in the documentation.
+
+EXTRACT_PRIVATE = YES
+
+# If the EXTRACT_STATIC tag is set to YES all static members of a file
+# will be included in the documentation.
+
+EXTRACT_STATIC = YES
+
+# If the EXTRACT_LOCAL_CLASSES tag is set to YES classes (and structs)
+# defined locally in source files will be included in the documentation.
+# If set to NO only classes defined in header files are included.
+
+EXTRACT_LOCAL_CLASSES = YES
+
+# This flag is only useful for Objective-C code. When set to YES local
+# methods, which are defined in the implementation section but not in
+# the interface are included in the documentation.
+# If set to NO (the default) only methods in the interface are included.
+
+EXTRACT_LOCAL_METHODS = YES
+
+# If this flag is set to YES, the members of anonymous namespaces will be
+# extracted and appear in the documentation as a namespace called
+# 'anonymous_namespace{file}', where file will be replaced with the base
+# name of the file that contains the anonymous namespace. By default
+# anonymous namespaces are hidden.
+
+EXTRACT_ANON_NSPACES = YES
+
+# If the HIDE_UNDOC_MEMBERS tag is set to YES, Doxygen will hide all
+# undocumented members of documented classes, files or namespaces.
+# If set to NO (the default) these members will be included in the
+# various overviews, but no documentation section is generated.
+# This option has no effect if EXTRACT_ALL is enabled.
+
+HIDE_UNDOC_MEMBERS = NO
+
+# If the HIDE_UNDOC_CLASSES tag is set to YES, Doxygen will hide all
+# undocumented classes that are normally visible in the class hierarchy.
+# If set to NO (the default) these classes will be included in the various
+# overviews. This option has no effect if EXTRACT_ALL is enabled.
+
+HIDE_UNDOC_CLASSES = NO
+
+# If the HIDE_FRIEND_COMPOUNDS tag is set to YES, Doxygen will hide all
+# friend (class|struct|union) declarations.
+# If set to NO (the default) these declarations will be included in the
+# documentation.
+
+HIDE_FRIEND_COMPOUNDS = NO
+
+# If the HIDE_IN_BODY_DOCS tag is set to YES, Doxygen will hide any
+# documentation blocks found inside the body of a function.
+# If set to NO (the default) these blocks will be appended to the
+# function's detailed documentation block.
+
+HIDE_IN_BODY_DOCS = NO
+
+# The INTERNAL_DOCS tag determines if documentation
+# that is typed after a \internal command is included. If the tag is set
+# to NO (the default) then the documentation will be excluded.
+# Set it to YES to include the internal documentation.
+
+INTERNAL_DOCS = NO
+
+# If the CASE_SENSE_NAMES tag is set to NO then Doxygen will only generate
+# file names in lower-case letters. If set to YES upper-case letters are also
+# allowed. This is useful if you have classes or files whose names only differ
+# in case and if your file system supports case sensitive file names. Windows
+# and Mac users are advised to set this option to NO.
+
+CASE_SENSE_NAMES = NO
+
+# If the HIDE_SCOPE_NAMES tag is set to NO (the default) then Doxygen
+# will show members with their full class and namespace scopes in the
+# documentation. If set to YES the scope will be hidden.
+
+HIDE_SCOPE_NAMES = NO
+
+# If the SHOW_INCLUDE_FILES tag is set to YES (the default) then Doxygen
+# will put a list of the files that are included by a file in the documentation
+# of that file.
+
+SHOW_INCLUDE_FILES = YES
+
+# If the FORCE_LOCAL_INCLUDES tag is set to YES then Doxygen
+# will list include files with double quotes in the documentation
+# rather than with sharp brackets.
+
+FORCE_LOCAL_INCLUDES = NO
+
+# If the INLINE_INFO tag is set to YES (the default) then a tag [inline]
+# is inserted in the documentation for inline members.
+
+INLINE_INFO = YES
+
+# If the SORT_MEMBER_DOCS tag is set to YES (the default) then doxygen
+# will sort the (detailed) documentation of file and class members
+# alphabetically by member name. If set to NO the members will appear in
+# declaration order.
+
+SORT_MEMBER_DOCS = YES
+
+# If the SORT_BRIEF_DOCS tag is set to YES then doxygen will sort the
+# brief documentation of file, namespace and class members alphabetically
+# by member name. If set to NO (the default) the members will appear in
+# declaration order.
+
+SORT_BRIEF_DOCS = NO
+
+# If the SORT_MEMBERS_CTORS_1ST tag is set to YES then doxygen
+# will sort the (brief and detailed) documentation of class members so that
+# constructors and destructors are listed first. If set to NO (the default)
+# the constructors will appear in the respective orders defined by
+# SORT_MEMBER_DOCS and SORT_BRIEF_DOCS.
+# This tag will be ignored for brief docs if SORT_BRIEF_DOCS is set to NO
+# and ignored for detailed docs if SORT_MEMBER_DOCS is set to NO.
+
+SORT_MEMBERS_CTORS_1ST = NO
+
+# If the SORT_GROUP_NAMES tag is set to YES then doxygen will sort the
+# hierarchy of group names into alphabetical order. If set to NO (the default)
+# the group names will appear in their defined order.
+
+SORT_GROUP_NAMES = NO
+
+# If the SORT_BY_SCOPE_NAME tag is set to YES, the class list will be
+# sorted by fully-qualified names, including namespaces. If set to
+# NO (the default), the class list will be sorted only by class name,
+# not including the namespace part.
+# Note: This option is not very useful if HIDE_SCOPE_NAMES is set to YES.
+# Note: This option applies only to the class list, not to the
+# alphabetical list.
+
+SORT_BY_SCOPE_NAME = NO
+
+# The GENERATE_TODOLIST tag can be used to enable (YES) or
+# disable (NO) the todo list. This list is created by putting \todo
+# commands in the documentation.
+
+GENERATE_TODOLIST = YES
+
+# The GENERATE_TESTLIST tag can be used to enable (YES) or
+# disable (NO) the test list. This list is created by putting \test
+# commands in the documentation.
+
+GENERATE_TESTLIST = YES
+
+# The GENERATE_BUGLIST tag can be used to enable (YES) or
+# disable (NO) the bug list. This list is created by putting \bug
+# commands in the documentation.
+
+GENERATE_BUGLIST = YES
+
+# The GENERATE_DEPRECATEDLIST tag can be used to enable (YES) or
+# disable (NO) the deprecated list. This list is created by putting
+# \deprecated commands in the documentation.
+
+GENERATE_DEPRECATEDLIST= YES
+
+# The ENABLED_SECTIONS tag can be used to enable conditional
+# documentation sections, marked by \if sectionname ... \endif.
+
+ENABLED_SECTIONS =
+
+# The MAX_INITIALIZER_LINES tag determines the maximum number of lines
+# the initial value of a variable or define consists of for it to appear in
+# the documentation. If the initializer consists of more lines than specified
+# here it will be hidden. Use a value of 0 to hide initializers completely.
+# The appearance of the initializer of individual variables and defines in the
+# documentation can be controlled using \showinitializer or \hideinitializer
+# command in the documentation regardless of this setting.
+
+MAX_INITIALIZER_LINES = 30
+
+# Set the SHOW_USED_FILES tag to NO to disable the list of files generated
+# at the bottom of the documentation of classes and structs. If set to YES the
+# list will mention the files that were used to generate the documentation.
+
+SHOW_USED_FILES = YES
+
+# If the sources in your project are distributed over multiple directories
+# then setting the SHOW_DIRECTORIES tag to YES will show the directory hierarchy
+# in the documentation. The default is NO.
+
+SHOW_DIRECTORIES = NO
+
+# Set the SHOW_FILES tag to NO to disable the generation of the Files page.
+# This will remove the Files entry from the Quick Index and from the
+# Folder Tree View (if specified). The default is YES.
+
+SHOW_FILES = YES
+
+# Set the SHOW_NAMESPACES tag to NO to disable the generation of the
+# Namespaces page. This will remove the Namespaces entry from the Quick Index
+# and from the Folder Tree View (if specified). The default is YES.
+
+SHOW_NAMESPACES = YES
+
+# The FILE_VERSION_FILTER tag can be used to specify a program or script that
+# doxygen should invoke to get the current version for each file (typically from
+# the version control system). Doxygen will invoke the program by executing (via
+# popen()) the command <command> <input-file>, where <command> is the value of
+# the FILE_VERSION_FILTER tag, and <input-file> is the name of an input file
+# provided by doxygen. Whatever the program writes to standard output
+# is used as the file version. See the manual for examples.
+
+FILE_VERSION_FILTER =
+
+# The LAYOUT_FILE tag can be used to specify a layout file which will be parsed by
+# doxygen. The layout file controls the global structure of the generated output files
+# in an output format independent way. To create the layout file that represents
+# doxygen's defaults, run doxygen with the -l option. You can optionally specify a
+# file name after the option, if omitted DoxygenLayout.xml will be used as the name
+# of the layout file.
+
+LAYOUT_FILE =
+
+#---------------------------------------------------------------------------
+# configuration options related to warning and progress messages
+#---------------------------------------------------------------------------
+
+# The QUIET tag can be used to turn on/off the messages that are generated
+# by doxygen. Possible values are YES and NO. If left blank NO is used.
+
+QUIET = NO
+
+# The WARNINGS tag can be used to turn on/off the warning messages that are
+# generated by doxygen. Possible values are YES and NO. If left blank
+# NO is used.
+
+WARNINGS = YES
+
+# If WARN_IF_UNDOCUMENTED is set to YES, then doxygen will generate warnings
+# for undocumented members. If EXTRACT_ALL is set to YES then this flag will
+# automatically be disabled.
+
+WARN_IF_UNDOCUMENTED = YES
+
+# If WARN_IF_DOC_ERROR is set to YES, doxygen will generate warnings for
+# potential errors in the documentation, such as not documenting some
+# parameters in a documented function, or documenting parameters that
+# don't exist or using markup commands wrongly.
+
+WARN_IF_DOC_ERROR = YES
+
+# This WARN_NO_PARAMDOC option can be enabled to get warnings for
+# functions that are documented, but have no documentation for their parameters
+# or return value. If set to NO (the default) doxygen will only warn about
+# wrong or incomplete parameter documentation, but not about the absence of
+# documentation.
+
+WARN_NO_PARAMDOC = YES
+
+# The WARN_FORMAT tag determines the format of the warning messages that
+# doxygen can produce. The string should contain the $file, $line, and $text
+# tags, which will be replaced by the file and line number from which the
+# warning originated and the warning text. Optionally the format may contain
+# $version, which will be replaced by the version of the file (if it could
+# be obtained via FILE_VERSION_FILTER)
+
+WARN_FORMAT = "$file:$line: $text"
+
+# The WARN_LOGFILE tag can be used to specify a file to which warning
+# and error messages should be written. If left blank the output is written
+# to stderr.
+
+WARN_LOGFILE =
+
+#---------------------------------------------------------------------------
+# configuration options related to the input files
+#---------------------------------------------------------------------------
+
+# The INPUT tag can be used to specify the files and/or directories that contain
+# documented source files. You may enter file names like "myfile.cpp" or
+# directories like "/usr/src/myproject". Separate the files or directories
+# with spaces.
+
+INPUT = D:/hq/stg/opencl/drivers/opencl/compiler/lib
+
+# This tag can be used to specify the character encoding of the source files
+# that doxygen parses. Internally doxygen uses the UTF-8 encoding, which is
+# also the default input encoding. Doxygen uses libiconv (or the iconv built
+# into libc) for the transcoding. See http://www.gnu.org/software/libiconv for
+# the list of possible encodings.
+
+INPUT_ENCODING = UTF-8
+
+# If the value of the INPUT tag contains directories, you can use the
+# FILE_PATTERNS tag to specify one or more wildcard pattern (like *.cpp
+# and *.h) to filter out the source-files in the directories. If left
+# blank the following patterns are tested:
+# *.c *.cc *.cxx *.cpp *.c++ *.java *.ii *.ixx *.ipp *.i++ *.inl *.h *.hh *.hxx
+# *.hpp *.h++ *.idl *.odl *.cs *.php *.php3 *.inc *.m *.mm *.py *.f90
+
+FILE_PATTERNS = *.c \
+ *.cc \
+ *.cxx \
+ *.cpp \
+ *.c++ \
+ *.d \
+ *.java \
+ *.ii \
+ *.ixx \
+ *.ipp \
+ *.i++ \
+ *.inl \
+ *.h \
+ *.hh \
+ *.hxx \
+ *.hpp \
+ *.h++ \
+ *.idl \
+ *.odl \
+ *.cs \
+ *.php \
+ *.php3 \
+ *.inc \
+ *.m \
+ *.mm \
+ *.dox \
+ *.py \
+ *.f90 \
+ *.f \
+ *.vhd \
+ *.vhdl
+
+# The RECURSIVE tag can be used to specify whether or not subdirectories
+# should be searched for input files as well. Possible values are YES and NO.
+# If left blank NO is used.
+
+RECURSIVE = YES
+
+# The EXCLUDE tag can be used to specify files and/or directories that should
+# be excluded from the INPUT source files. This way you can easily exclude a
+# subdirectory from a directory tree whose root is specified with the INPUT tag.
+
+EXCLUDE = D:/hq/stg/opencl/drivers/opencl/compiler/lib/backends/gpu/sc \
+ D:/hq/stg/opencl/drivers/opencl/compiler/lib/loaders/elf \
+ D:/hq/stg/opencl/drivers/opencl/compiler/lib/promotions \
+ D:/hq/stg/opencl/drivers/opencl/compiler/lib/loaders/bif/amuabi \
+ D:/hq/stg/opencl/drivers/opencl/compiler/lib/include/v0_7 \
+ D:/hq/stg/opencl/drivers/opencl/compiler/lib/api/v0_7 \
+ D:/hq/stg/opencl/drivers/opencl/compiler/lib/loaders/plugins
+
+# The EXCLUDE_SYMLINKS tag can be used to select whether or not files or
+# directories that are symbolic links (a Unix filesystem feature) are excluded
+# from the input.
+
+EXCLUDE_SYMLINKS = YES
+
+# If the value of the INPUT tag contains directories, you can use the
+# EXCLUDE_PATTERNS tag to specify one or more wildcard patterns to exclude
+# certain files from those directories. Note that the wildcards are matched
+# against the file with absolute path, so to exclude all test directories
+# for example use the pattern */test/*
+
+EXCLUDE_PATTERNS = *.d
+
+# The EXCLUDE_SYMBOLS tag can be used to specify one or more symbol names
+# (namespaces, classes, functions, etc.) that should be excluded from the
+# output. The symbol name can be a fully qualified name, a word, or if the
+# wildcard * is used, a substring. Examples: ANamespace, AClass,
+# AClass::ANamespace, ANamespace::*Test
+
+EXCLUDE_SYMBOLS =
+
+# The EXAMPLE_PATH tag can be used to specify one or more files or
+# directories that contain example code fragments that are included (see
+# the \include command).
+
+EXAMPLE_PATH =
+
+# If the value of the EXAMPLE_PATH tag contains directories, you can use the
+# EXAMPLE_PATTERNS tag to specify one or more wildcard pattern (like *.cpp
+# and *.h) to filter out the source-files in the directories. If left
+# blank all files are included.
+
+EXAMPLE_PATTERNS = *
+
+# If the EXAMPLE_RECURSIVE tag is set to YES then subdirectories will be
+# searched for input files to be used with the \include or \dontinclude
+# commands irrespective of the value of the RECURSIVE tag.
+# Possible values are YES and NO. If left blank NO is used.
+
+EXAMPLE_RECURSIVE = NO
+
+# The IMAGE_PATH tag can be used to specify one or more files or
+# directories that contain images that are included in the documentation (see
+# the \image command).
+
+IMAGE_PATH =
+
+# The INPUT_FILTER tag can be used to specify a program that doxygen should
+# invoke to filter for each input file. Doxygen will invoke the filter program
+# by executing (via popen()) the command <filter> <input-file>, where <filter>
+# is the value of the INPUT_FILTER tag, and <input-file> is the name of an
+# input file. Doxygen will then use the output that the filter program writes
+# to standard output. If FILTER_PATTERNS is specified, this tag will be
+# ignored.
+
+INPUT_FILTER =
+
+# The FILTER_PATTERNS tag can be used to specify filters on a per file pattern
+# basis. Doxygen will compare the file name with each pattern and apply the
+# filter if there is a match. The filters are a list of the form:
+# pattern=filter (like *.cpp=my_cpp_filter). See INPUT_FILTER for further
+# info on how filters are used. If FILTER_PATTERNS is empty, INPUT_FILTER
+# is applied to all files.
+
+FILTER_PATTERNS =
+
+# If the FILTER_SOURCE_FILES tag is set to YES, the input filter (if set using
+# INPUT_FILTER) will be used to filter the input files when producing source
+# files to browse (i.e. when SOURCE_BROWSER is set to YES).
+
+FILTER_SOURCE_FILES = NO
+
+#---------------------------------------------------------------------------
+# configuration options related to source browsing
+#---------------------------------------------------------------------------
+
+# If the SOURCE_BROWSER tag is set to YES then a list of source files will
+# be generated. Documented entities will be cross-referenced with these sources.
+# Note: To get rid of all source code in the generated output, make sure also
+# VERBATIM_HEADERS is set to NO.
+
+SOURCE_BROWSER = YES
+
+# Setting the INLINE_SOURCES tag to YES will include the body
+# of functions and classes directly in the documentation.
+
+INLINE_SOURCES = YES
+
+# Setting the STRIP_CODE_COMMENTS tag to YES (the default) will instruct
+# doxygen to hide any special comment blocks from generated source code
+# fragments. Normal C and C++ comments will always remain visible.
+
+STRIP_CODE_COMMENTS = YES
+
+# If the REFERENCED_BY_RELATION tag is set to YES
+# then for each documented function all documented
+# functions referencing it will be listed.
+
+REFERENCED_BY_RELATION = YES
+
+# If the REFERENCES_RELATION tag is set to YES
+# then for each documented function all documented entities
+# called/used by that function will be listed.
+
+REFERENCES_RELATION = YES
+
+# If the REFERENCES_LINK_SOURCE tag is set to YES (the default)
+# and SOURCE_BROWSER tag is set to YES, then the hyperlinks from
+# functions in REFERENCES_RELATION and REFERENCED_BY_RELATION lists will
+# link to the source code. Otherwise they will link to the documentation.
+
+REFERENCES_LINK_SOURCE = YES
+
+# If the USE_HTAGS tag is set to YES then the references to source code
+# will point to the HTML generated by the htags(1) tool instead of doxygen
+# built-in source browser. The htags tool is part of GNU's global source
+# tagging system (see http://www.gnu.org/software/global/global.html). You
+# will need version 4.8.6 or higher.
+
+USE_HTAGS = NO
+
+# If the VERBATIM_HEADERS tag is set to YES (the default) then Doxygen
+# will generate a verbatim copy of the header file for each class for
+# which an include is specified. Set to NO to disable this.
+
+VERBATIM_HEADERS = YES
+
+#---------------------------------------------------------------------------
+# configuration options related to the alphabetical class index
+#---------------------------------------------------------------------------
+
+# If the ALPHABETICAL_INDEX tag is set to YES, an alphabetical index
+# of all compounds will be generated. Enable this if the project
+# contains a lot of classes, structs, unions or interfaces.
+
+ALPHABETICAL_INDEX = NO
+
+# If the alphabetical index is enabled (see ALPHABETICAL_INDEX) then
+# the COLS_IN_ALPHA_INDEX tag can be used to specify the number of columns
+# in which this list will be split (can be a number in the range [1..20])
+
+COLS_IN_ALPHA_INDEX = 5
+
+# In case all classes in a project start with a common prefix, all
+# classes will be put under the same header in the alphabetical index.
+# The IGNORE_PREFIX tag can be used to specify one or more prefixes that
+# should be ignored while generating the index headers.
+
+IGNORE_PREFIX =
+
+#---------------------------------------------------------------------------
+# configuration options related to the HTML output
+#---------------------------------------------------------------------------
+
+# If the GENERATE_HTML tag is set to YES (the default) Doxygen will
+# generate HTML output.
+
+GENERATE_HTML = YES
+
+# The HTML_OUTPUT tag is used to specify where the HTML docs will be put.
+# If a relative path is entered the value of OUTPUT_DIRECTORY will be
+# put in front of it. If left blank `html' will be used as the default path.
+
+HTML_OUTPUT = html
+
+# The HTML_FILE_EXTENSION tag can be used to specify the file extension for
+# each generated HTML page (for example: .htm,.php,.asp). If it is left blank
+# doxygen will generate files with .html extension.
+
+HTML_FILE_EXTENSION = .html
+
+# The HTML_HEADER tag can be used to specify a personal HTML header for
+# each generated HTML page. If it is left blank doxygen will generate a
+# standard header.
+
+HTML_HEADER =
+
+# The HTML_FOOTER tag can be used to specify a personal HTML footer for
+# each generated HTML page. If it is left blank doxygen will generate a
+# standard footer.
+
+HTML_FOOTER =
+
+# The HTML_STYLESHEET tag can be used to specify a user-defined cascading
+# style sheet that is used by each HTML page. It can be used to
+# fine-tune the look of the HTML output. If the tag is left blank doxygen
+# will generate a default style sheet. Note that doxygen will try to copy
+# the style sheet file to the HTML output directory, so don't put your own
+# stylesheet in the HTML output directory as well, or it will be erased!
+
+HTML_STYLESHEET =
+
+# If the HTML_TIMESTAMP tag is set to YES then the footer of each generated HTML
+# page will contain the date and time when the page was generated. Setting
+# this to NO can help when comparing the output of multiple runs.
+
+HTML_TIMESTAMP = YES
+
+# If the HTML_ALIGN_MEMBERS tag is set to YES, the members of classes,
+# files or namespaces will be aligned in HTML using tables. If set to
+# NO a bullet list will be used.
+
+HTML_ALIGN_MEMBERS = YES
+
+# If the HTML_DYNAMIC_SECTIONS tag is set to YES then the generated HTML
+# documentation will contain sections that can be hidden and shown after the
+# page has loaded. For this to work a browser that supports
+# JavaScript and DHTML is required (for instance Mozilla 1.0+, Firefox,
+# Netscape 6.0+, Internet explorer 5.0+, Konqueror, or Safari).
+
+HTML_DYNAMIC_SECTIONS = NO
+
+# If the GENERATE_DOCSET tag is set to YES, additional index files
+# will be generated that can be used as input for Apple's Xcode 3
+# integrated development environment, introduced with OSX 10.5 (Leopard).
+# To create a documentation set, doxygen will generate a Makefile in the
+# HTML output directory. Running make will produce the docset in that
+# directory and running "make install" will install the docset in
+# ~/Library/Developer/Shared/Documentation/DocSets so that Xcode will find
+# it at startup.
+# See http://developer.apple.com/tools/creatingdocsetswithdoxygen.html for more information.
+
+GENERATE_DOCSET = NO
+
+# When GENERATE_DOCSET tag is set to YES, this tag determines the name of the
+# feed. A documentation feed provides an umbrella under which multiple
+# documentation sets from a single provider (such as a company or product suite)
+# can be grouped.
+
+DOCSET_FEEDNAME = "Doxygen generated docs"
+
+# When GENERATE_DOCSET tag is set to YES, this tag specifies a string that
+# should uniquely identify the documentation set bundle. This should be a
+# reverse domain-name style string, e.g. com.mycompany.MyDocSet. Doxygen
+# will append .docset to the name.
+
+DOCSET_BUNDLE_ID = org.doxygen.Project
+
+# If the GENERATE_HTMLHELP tag is set to YES, additional index files
+# will be generated that can be used as input for tools like the
+# Microsoft HTML help workshop to generate a compiled HTML help file (.chm)
+# of the generated HTML documentation.
+
+GENERATE_HTMLHELP = NO
+
+# If the GENERATE_HTMLHELP tag is set to YES, the CHM_FILE tag can
+# be used to specify the file name of the resulting .chm file. You
+# can add a path in front of the file if the result should not be
+# written to the html output directory.
+
+CHM_FILE =
+
+# If the GENERATE_HTMLHELP tag is set to YES, the HHC_LOCATION tag can
+# be used to specify the location (absolute path including file name) of
+# the HTML help compiler (hhc.exe). If non-empty doxygen will try to run
+# the HTML help compiler on the generated index.hhp.
+
+HHC_LOCATION =
+
+# If the GENERATE_HTMLHELP tag is set to YES, the GENERATE_CHI flag
+# controls if a separate .chi index file is generated (YES) or that
+# it should be included in the master .chm file (NO).
+
+GENERATE_CHI = NO
+
+# If the GENERATE_HTMLHELP tag is set to YES, the CHM_INDEX_ENCODING
+# is used to encode HtmlHelp index (hhk), content (hhc) and project file
+# content.
+
+CHM_INDEX_ENCODING =
+
+# If the GENERATE_HTMLHELP tag is set to YES, the BINARY_TOC flag
+# controls whether a binary table of contents is generated (YES) or a
+# normal table of contents (NO) in the .chm file.
+
+BINARY_TOC = NO
+
+# The TOC_EXPAND flag can be set to YES to add extra items for group members
+# to the contents of the HTML help documentation and to the tree view.
+
+TOC_EXPAND = NO
+
+# If the GENERATE_QHP tag is set to YES and both QHP_NAMESPACE and QHP_VIRTUAL_FOLDER
+# are set, an additional index file will be generated that can be used as input for
+# Qt's qhelpgenerator to generate a Qt Compressed Help (.qch) of the generated
+# HTML documentation.
+
+GENERATE_QHP = NO
+
+# If the QHG_LOCATION tag is specified, the QCH_FILE tag can
+# be used to specify the file name of the resulting .qch file.
+# The path specified is relative to the HTML output folder.
+
+QCH_FILE =
+
+# The QHP_NAMESPACE tag specifies the namespace to use when generating
+# Qt Help Project output. For more information please see
+# http://doc.trolltech.com/qthelpproject.html#namespace
+
+QHP_NAMESPACE = org.doxygen.Project
+
+# The QHP_VIRTUAL_FOLDER tag specifies the namespace to use when generating
+# Qt Help Project output. For more information please see
+# http://doc.trolltech.com/qthelpproject.html#virtual-folders
+
+QHP_VIRTUAL_FOLDER = doc
+
+# If QHP_CUST_FILTER_NAME is set, it specifies the name of a custom filter to add.
+# For more information please see
+# http://doc.trolltech.com/qthelpproject.html#custom-filters
+
+QHP_CUST_FILTER_NAME =
+
+# The QHP_CUST_FILTER_ATTRS tag specifies the list of the attributes of the
+# custom filter to add. For more information please see
+# Qt Help Project / Custom Filters.
+
+QHP_CUST_FILTER_ATTRS =
+
+# The QHP_SECT_FILTER_ATTRS tag specifies the list of the attributes this project's
+# filter section matches.
+# Qt Help Project / Filter Attributes.
+
+QHP_SECT_FILTER_ATTRS =
+
+# If the GENERATE_QHP tag is set to YES, the QHG_LOCATION tag can
+# be used to specify the location of Qt's qhelpgenerator.
+# If non-empty doxygen will try to run qhelpgenerator on the generated
+# .qhp file.
+
+QHG_LOCATION =
+
+# If the GENERATE_ECLIPSEHELP tag is set to YES, additional index files
+# will be generated, which together with the HTML files, form an Eclipse help
+# plugin. To install this plugin and make it available under the help contents
+# menu in Eclipse, the contents of the directory containing the HTML and XML
+# files needs to be copied into the plugins directory of eclipse. The name of
+# the directory within the plugins directory should be the same as
+# the ECLIPSE_DOC_ID value. After copying Eclipse needs to be restarted before
+# the help appears.
+
+GENERATE_ECLIPSEHELP = NO
+
+# A unique identifier for the eclipse help plugin. When installing the plugin
+# the directory name containing the HTML and XML files should also have
+# this name.
+
+ECLIPSE_DOC_ID = org.doxygen.Project
+
+# The DISABLE_INDEX tag can be used to turn on/off the condensed index at
+# top of each HTML page. The value NO (the default) enables the index and
+# the value YES disables it.
+
+DISABLE_INDEX = NO
+
+# This tag can be used to set the number of enum values (range [1..20])
+# that doxygen will group on one line in the generated HTML documentation.
+
+ENUM_VALUES_PER_LINE = 4
+
+# The GENERATE_TREEVIEW tag is used to specify whether a tree-like index
+# structure should be generated to display hierarchical information.
+# If the tag value is set to YES, a side panel will be generated
+# containing a tree-like index structure (just like the one that
+# is generated for HTML Help). For this to work a browser that supports
+# JavaScript, DHTML, CSS and frames is required (i.e. any modern browser).
+# Windows users are probably better off using the HTML help feature.
+
+GENERATE_TREEVIEW = YES
+
+# By enabling USE_INLINE_TREES, doxygen will generate the Groups, Directories,
+# and Class Hierarchy pages using a tree view instead of an ordered list.
+
+USE_INLINE_TREES = NO
+
+# If the treeview is enabled (see GENERATE_TREEVIEW) then this tag can be
+# used to set the initial width (in pixels) of the frame in which the tree
+# is shown.
+
+TREEVIEW_WIDTH = 250
+
+# Use this tag to change the font size of Latex formulas included
+# as images in the HTML documentation. The default is 10. Note that
+# when you change the font size after a successful doxygen run you need
+# to manually remove any form_*.png images from the HTML output directory
+# to force them to be regenerated.
+
+FORMULA_FONTSIZE = 10
+
+# When the SEARCHENGINE tag is enabled doxygen will generate a search box
+# for the HTML output. The underlying search engine uses javascript
+# and DHTML and should work on any modern browser. Note that when using
+# HTML help (GENERATE_HTMLHELP), Qt help (GENERATE_QHP), or docsets
+# (GENERATE_DOCSET) there is already a search function so this one should
+# typically be disabled. For large projects the javascript based search engine
+# can be slow, then enabling SERVER_BASED_SEARCH may provide a better solution.
+
+SEARCHENGINE = NO
+
+# When the SERVER_BASED_SEARCH tag is enabled the search engine will be
+# implemented using a PHP enabled web server instead of at the web client
+# using Javascript. Doxygen will generate the search PHP script and index
+# file to put on the web server. The advantage of the server
+# based approach is that it scales better to large projects and allows
+# full text search. The disadvantage is that it is more difficult to set up
+# and does not have live searching capabilities.
+
+SERVER_BASED_SEARCH = NO
+
+#---------------------------------------------------------------------------
+# configuration options related to the LaTeX output
+#---------------------------------------------------------------------------
+
+# If the GENERATE_LATEX tag is set to YES (the default) Doxygen will
+# generate Latex output.
+
+GENERATE_LATEX = NO
+
+# The LATEX_OUTPUT tag is used to specify where the LaTeX docs will be put.
+# If a relative path is entered the value of OUTPUT_DIRECTORY will be
+# put in front of it. If left blank `latex' will be used as the default path.
+
+LATEX_OUTPUT = latex
+
+# The LATEX_CMD_NAME tag can be used to specify the LaTeX command name to be
+# invoked. If left blank `latex' will be used as the default command name.
+# Note that when enabling USE_PDFLATEX this option is only used for
+# generating bitmaps for formulas in the HTML output, but not in the
+# Makefile that is written to the output directory.
+
+LATEX_CMD_NAME = latex
+
+# The MAKEINDEX_CMD_NAME tag can be used to specify the command name to
+# generate index for LaTeX. If left blank `makeindex' will be used as the
+# default command name.
+
+MAKEINDEX_CMD_NAME = makeindex
+
+# If the COMPACT_LATEX tag is set to YES Doxygen generates more compact
+# LaTeX documents. This may be useful for small projects and may help to
+# save some trees in general.
+
+COMPACT_LATEX = NO
+
+# The PAPER_TYPE tag can be used to set the paper type that is used
+# by the printer. Possible values are: a4, a4wide, letter, legal and
+# executive. If left blank a4wide will be used.
+
+PAPER_TYPE = a4wide
+
+# The EXTRA_PACKAGES tag can be used to specify one or more names of LaTeX
+# packages that should be included in the LaTeX output.
+
+EXTRA_PACKAGES =
+
+# The LATEX_HEADER tag can be used to specify a personal LaTeX header for
+# the generated latex document. The header should contain everything until
+# the first chapter. If it is left blank doxygen will generate a
+# standard header. Notice: only use this tag if you know what you are doing!
+
+LATEX_HEADER =
+
+# If the PDF_HYPERLINKS tag is set to YES, the LaTeX that is generated
+# is prepared for conversion to pdf (using ps2pdf). The pdf file will
+# contain links (just like the HTML output) instead of page references
+# This makes the output suitable for online browsing using a pdf viewer.
+
+PDF_HYPERLINKS = YES
+
+# If the USE_PDFLATEX tag is set to YES, pdflatex will be used instead of
+# plain latex in the generated Makefile. Set this option to YES to get a
+# higher quality PDF documentation.
+
+USE_PDFLATEX = YES
+
+# If the LATEX_BATCHMODE tag is set to YES, doxygen will add the \batchmode
+# command to the generated LaTeX files. This will instruct LaTeX to keep
+# running if errors occur, instead of asking the user for help.
+# This option is also used when generating formulas in HTML.
+
+LATEX_BATCHMODE = NO
+
+# If LATEX_HIDE_INDICES is set to YES then doxygen will not
+# include the index chapters (such as File Index, Compound Index, etc.)
+# in the output.
+
+LATEX_HIDE_INDICES = NO
+
+# If LATEX_SOURCE_CODE is set to YES then doxygen will include
+# source code with syntax highlighting in the LaTeX output.
+# Note that which sources are shown also depends on other settings
+# such as SOURCE_BROWSER.
+
+LATEX_SOURCE_CODE = NO
+
+#---------------------------------------------------------------------------
+# configuration options related to the RTF output
+#---------------------------------------------------------------------------
+
+# If the GENERATE_RTF tag is set to YES Doxygen will generate RTF output
+# The RTF output is optimized for Word 97 and may not look very pretty with
+# other RTF readers or editors.
+
+GENERATE_RTF = NO
+
+# The RTF_OUTPUT tag is used to specify where the RTF docs will be put.
+# If a relative path is entered the value of OUTPUT_DIRECTORY will be
+# put in front of it. If left blank `rtf' will be used as the default path.
+
+RTF_OUTPUT = rtf
+
+# If the COMPACT_RTF tag is set to YES Doxygen generates more compact
+# RTF documents. This may be useful for small projects and may help to
+# save some trees in general.
+
+COMPACT_RTF = NO
+
+# If the RTF_HYPERLINKS tag is set to YES, the RTF that is generated
+# will contain hyperlink fields. The RTF file will
+# contain links (just like the HTML output) instead of page references.
+# This makes the output suitable for online browsing using WORD or other
+# programs which support those fields.
+# Note: wordpad (write) and others do not support links.
+
+RTF_HYPERLINKS = NO
+
+# Load stylesheet definitions from file. Syntax is similar to doxygen's
+# config file, i.e. a series of assignments. You only have to provide
+# replacements, missing definitions are set to their default value.
+
+RTF_STYLESHEET_FILE =
+
+# Set optional variables used in the generation of an rtf document.
+# Syntax is similar to doxygen's config file.
+
+RTF_EXTENSIONS_FILE =
+
+#---------------------------------------------------------------------------
+# configuration options related to the man page output
+#---------------------------------------------------------------------------
+
+# If the GENERATE_MAN tag is set to YES (the default) Doxygen will
+# generate man pages
+
+GENERATE_MAN = NO
+
+# The MAN_OUTPUT tag is used to specify where the man pages will be put.
+# If a relative path is entered the value of OUTPUT_DIRECTORY will be
+# put in front of it. If left blank `man' will be used as the default path.
+
+MAN_OUTPUT = man
+
+# The MAN_EXTENSION tag determines the extension that is added to
+# the generated man pages (default is the subroutine's section .3)
+
+MAN_EXTENSION = .3
+
+# If the MAN_LINKS tag is set to YES and Doxygen generates man output,
+# then it will generate one additional man file for each entity
+# documented in the real man page(s). These additional files
+# only source the real man page, but without them the man command
+# would be unable to find the correct page. The default is NO.
+
+MAN_LINKS = NO
+
+#---------------------------------------------------------------------------
+# configuration options related to the XML output
+#---------------------------------------------------------------------------
+
+# If the GENERATE_XML tag is set to YES Doxygen will
+# generate an XML file that captures the structure of
+# the code including all documentation.
+
+GENERATE_XML = NO
+
+# The XML_OUTPUT tag is used to specify where the XML pages will be put.
+# If a relative path is entered the value of OUTPUT_DIRECTORY will be
+# put in front of it. If left blank `xml' will be used as the default path.
+
+XML_OUTPUT = xml
+
+# The XML_SCHEMA tag can be used to specify an XML schema,
+# which can be used by a validating XML parser to check the
+# syntax of the XML files.
+
+XML_SCHEMA =
+
+# The XML_DTD tag can be used to specify an XML DTD,
+# which can be used by a validating XML parser to check the
+# syntax of the XML files.
+
+XML_DTD =
+
+# If the XML_PROGRAMLISTING tag is set to YES Doxygen will
+# dump the program listings (including syntax highlighting
+# and cross-referencing information) to the XML output. Note that
+# enabling this will significantly increase the size of the XML output.
+
+XML_PROGRAMLISTING = YES
+
+#---------------------------------------------------------------------------
+# configuration options for the AutoGen Definitions output
+#---------------------------------------------------------------------------
+
+# If the GENERATE_AUTOGEN_DEF tag is set to YES Doxygen will
+# generate an AutoGen Definitions (see autogen.sf.net) file
+# that captures the structure of the code including all
+# documentation. Note that this feature is still experimental
+# and incomplete at the moment.
+
+GENERATE_AUTOGEN_DEF = NO
+
+#---------------------------------------------------------------------------
+# configuration options related to the Perl module output
+#---------------------------------------------------------------------------
+
+# If the GENERATE_PERLMOD tag is set to YES Doxygen will
+# generate a Perl module file that captures the structure of
+# the code including all documentation. Note that this
+# feature is still experimental and incomplete at the
+# moment.
+
+GENERATE_PERLMOD = NO
+
+# If the PERLMOD_LATEX tag is set to YES Doxygen will generate
+# the necessary Makefile rules, Perl scripts and LaTeX code to be able
+# to generate PDF and DVI output from the Perl module output.
+
+PERLMOD_LATEX = NO
+
+# If the PERLMOD_PRETTY tag is set to YES the Perl module output will be
+# nicely formatted so it can be parsed by a human reader. This is useful
+# if you want to understand what is going on. On the other hand, if this
+# tag is set to NO the size of the Perl module output will be much smaller
+# and Perl will parse it just the same.
+
+PERLMOD_PRETTY = YES
+
+# The names of the make variables in the generated doxyrules.make file
+# are prefixed with the string contained in PERLMOD_MAKEVAR_PREFIX.
+# This is useful so different doxyrules.make files included by the same
+# Makefile don't overwrite each other's variables.
+
+PERLMOD_MAKEVAR_PREFIX =
+
+#---------------------------------------------------------------------------
+# Configuration options related to the preprocessor
+#---------------------------------------------------------------------------
+
+# If the ENABLE_PREPROCESSING tag is set to YES (the default) Doxygen will
+# evaluate all C-preprocessor directives found in the sources and include
+# files.
+
+ENABLE_PREPROCESSING = YES
+
+# If the MACRO_EXPANSION tag is set to YES Doxygen will expand all macro
+# names in the source code. If set to NO (the default) only conditional
+# compilation will be performed. Macro expansion can be done in a controlled
+# way by setting EXPAND_ONLY_PREDEF to YES.
+
+MACRO_EXPANSION = NO
+
+# If the EXPAND_ONLY_PREDEF and MACRO_EXPANSION tags are both set to YES
+# then the macro expansion is limited to the macros specified with the
+# PREDEFINED and EXPAND_AS_DEFINED tags.
+
+EXPAND_ONLY_PREDEF = NO
+
+# If the SEARCH_INCLUDES tag is set to YES (the default) the include files
+# in the INCLUDE_PATH (see below) will be searched if a #include is found.
+
+SEARCH_INCLUDES = YES
+
+# The INCLUDE_PATH tag can be used to specify one or more directories that
+# contain include files that are not input files but should be processed by
+# the preprocessor.
+
+INCLUDE_PATH =
+
+# You can use the INCLUDE_FILE_PATTERNS tag to specify one or more wildcard
+# patterns (like *.h and *.hpp) to filter out the header-files in the
+# directories. If left blank, the patterns specified with FILE_PATTERNS will
+# be used.
+
+INCLUDE_FILE_PATTERNS =
+
+# The PREDEFINED tag can be used to specify one or more macro names that
+# are defined before the preprocessor is started (similar to the -D option of
+# gcc). The argument of the tag is a list of macros of the form: name
+# or name=definition (no spaces). If the definition and the = are
+# omitted =1 is assumed. To prevent a macro definition from being
+# undefined via #undef or recursively expanded use the := operator
+# instead of the = operator.
+
+PREDEFINED =
+
+# If the MACRO_EXPANSION and EXPAND_ONLY_PREDEF tags are set to YES then
+# this tag can be used to specify a list of macro names that should be expanded.
+# The macro definition that is found in the sources will be used.
+# Use the PREDEFINED tag if you want to use a different macro definition.
+
+EXPAND_AS_DEFINED =
+
+# If the SKIP_FUNCTION_MACROS tag is set to YES (the default) then
+# doxygen's preprocessor will remove all function-like macros that are alone
+# on a line, have an all uppercase name, and do not end with a semicolon. Such
+# function macros are typically used for boiler-plate code, and will confuse
+# the parser if not removed.
+
+SKIP_FUNCTION_MACROS = YES
+
+#---------------------------------------------------------------------------
+# Configuration::additions related to external references
+#---------------------------------------------------------------------------
+
+# The TAGFILES option can be used to specify one or more tagfiles.
+# Optionally an initial location of the external documentation
+# can be added for each tagfile. The format of a tag file without
+# this location is as follows:
+# TAGFILES = file1 file2 ...
+# Adding location for the tag files is done as follows:
+# TAGFILES = file1=loc1 "file2 = loc2" ...
+# where "loc1" and "loc2" can be relative or absolute paths or
+# URLs. If a location is present for each tag, the installdox tool
+# does not have to be run to correct the links.
+# Note that each tag file must have a unique name
+# (where the name does NOT include the path)
+# If a tag file is not located in the directory in which doxygen
+# is run, you must also specify the path to the tagfile here.
+
+TAGFILES =
+
+# When a file name is specified after GENERATE_TAGFILE, doxygen will create
+# a tag file that is based on the input files it reads.
+
+GENERATE_TAGFILE =
+
+# If the ALLEXTERNALS tag is set to YES all external classes will be listed
+# in the class index. If set to NO only the inherited external classes
+# will be listed.
+
+ALLEXTERNALS = NO
+
+# If the EXTERNAL_GROUPS tag is set to YES all external groups will be listed
+# in the modules index. If set to NO, only the current project's groups will
+# be listed.
+
+EXTERNAL_GROUPS = YES
+
+# The PERL_PATH should be the absolute path and name of the perl script
+# interpreter (i.e. the result of `which perl').
+
+PERL_PATH = /usr/bin/perl
+
+#---------------------------------------------------------------------------
+# Configuration options related to the dot tool
+#---------------------------------------------------------------------------
+
+# If the CLASS_DIAGRAMS tag is set to YES (the default) Doxygen will
+# generate an inheritance diagram (in HTML, RTF and LaTeX) for classes with base
+# or super classes. Setting the tag to NO turns the diagrams off. Note that
+# this option is superseded by the HAVE_DOT option below. This is only a
+# fallback. It is recommended to install and use dot, since it yields more
+# powerful graphs.
+
+CLASS_DIAGRAMS = YES
+
+# You can define message sequence charts within doxygen comments using the \msc
+# command. Doxygen will then run the mscgen tool (see
+# http://www.mcternan.me.uk/mscgen/) to produce the chart and insert it in the
+# documentation. The MSCGEN_PATH tag allows you to specify the directory where
+# the mscgen tool resides. If left empty the tool is assumed to be found in the
+# default search path.
+
+MSCGEN_PATH =
+
+# If set to YES, the inheritance and collaboration graphs will hide
+# inheritance and usage relations if the target is undocumented
+# or is not a class.
+
+HIDE_UNDOC_RELATIONS = YES
+
+# If you set the HAVE_DOT tag to YES then doxygen will assume the dot tool is
+# available from the path. This tool is part of Graphviz, a graph visualization
+# toolkit from AT&T and Lucent Bell Labs. The other options in this section
+# have no effect if this option is set to NO (the default)
+
+HAVE_DOT = NO
+
+# By default doxygen will write a font called FreeSans.ttf to the output
+# directory and reference it in all dot files that doxygen generates. This
+# font does not include all possible unicode characters however, so when you need
+# these (or just want a differently looking font) you can specify the font name
+# using DOT_FONTNAME. You need to make sure dot is able to find the font,
+# which can be done by putting it in a standard location or by setting the
+# DOTFONTPATH environment variable or by setting DOT_FONTPATH to the directory
+# containing the font.
+
+DOT_FONTNAME = FreeSans
+
+# The DOT_FONTSIZE tag can be used to set the size of the font of dot graphs.
+# The default size is 10pt.
+
+DOT_FONTSIZE = 10
+
+# By default doxygen will tell dot to use the output directory to look for the
+# FreeSans.ttf font (which doxygen will put there itself). If you specify a
+# different font using DOT_FONTNAME you can set the path where dot
+# can find it using this tag.
+
+DOT_FONTPATH =
+
+# If the CLASS_GRAPH and HAVE_DOT tags are set to YES then doxygen
+# will generate a graph for each documented class showing the direct and
+# indirect inheritance relations. Setting this tag to YES will force the
+# CLASS_DIAGRAMS tag to NO.
+
+CLASS_GRAPH = YES
+
+# If the COLLABORATION_GRAPH and HAVE_DOT tags are set to YES then doxygen
+# will generate a graph for each documented class showing the direct and
+# indirect implementation dependencies (inheritance, containment, and
+# class references variables) of the class with other documented classes.
+
+COLLABORATION_GRAPH = YES
+
+# If the GROUP_GRAPHS and HAVE_DOT tags are set to YES then doxygen
+# will generate a graph for groups, showing the direct group dependencies.
+
+GROUP_GRAPHS = YES
+
+# If the UML_LOOK tag is set to YES doxygen will generate inheritance and
+# collaboration diagrams in a style similar to the OMG's Unified Modeling
+# Language.
+
+UML_LOOK = NO
+
+# If set to YES, the inheritance and collaboration graphs will show the
+# relations between templates and their instances.
+
+TEMPLATE_RELATIONS = NO
+
+# If the ENABLE_PREPROCESSING, SEARCH_INCLUDES, INCLUDE_GRAPH, and HAVE_DOT
+# tags are set to YES then doxygen will generate a graph for each documented
+# file showing the direct and indirect include dependencies of the file with
+# other documented files.
+
+INCLUDE_GRAPH = YES
+
+# If the ENABLE_PREPROCESSING, SEARCH_INCLUDES, INCLUDED_BY_GRAPH, and
+# HAVE_DOT tags are set to YES then doxygen will generate a graph for each
+# documented header file showing the documented files that directly or
+# indirectly include this file.
+
+INCLUDED_BY_GRAPH = YES
+
+# If the CALL_GRAPH and HAVE_DOT options are set to YES then
+# doxygen will generate a call dependency graph for every global function
+# or class method. Note that enabling this option will significantly increase
+# the time of a run. So in most cases it will be better to enable call graphs
+# for selected functions only using the \callgraph command.
+
+CALL_GRAPH = NO
+
+# If the CALLER_GRAPH and HAVE_DOT tags are set to YES then
+# doxygen will generate a caller dependency graph for every global function
+# or class method. Note that enabling this option will significantly increase
+# the time of a run. So in most cases it will be better to enable caller
+# graphs for selected functions only using the \callergraph command.
+
+CALLER_GRAPH = NO
+
+# If the GRAPHICAL_HIERARCHY and HAVE_DOT tags are set to YES then doxygen
+# will generate a graphical hierarchy of all classes instead of a textual one.
+
+GRAPHICAL_HIERARCHY = YES
+
+# If the DIRECTORY_GRAPH, SHOW_DIRECTORIES and HAVE_DOT tags are set to YES
+# then doxygen will show the dependencies a directory has on other directories
+# in a graphical way. The dependency relations are determined by the #include
+# relations between the files in the directories.
+
+DIRECTORY_GRAPH = YES
+
+# The DOT_IMAGE_FORMAT tag can be used to set the image format of the images
+# generated by dot. Possible values are png, jpg, or gif
+# If left blank png will be used.
+
+DOT_IMAGE_FORMAT = png
+
+# The tag DOT_PATH can be used to specify the path where the dot tool can be
+# found. If left blank, it is assumed the dot tool can be found in the path.
+
+DOT_PATH =
+
+# The DOTFILE_DIRS tag can be used to specify one or more directories that
+# contain dot files that are included in the documentation (see the
+# \dotfile command).
+
+DOTFILE_DIRS =
+
+# The DOT_GRAPH_MAX_NODES tag can be used to set the maximum number of
+# nodes that will be shown in the graph. If the number of nodes in a graph
+# becomes larger than this value, doxygen will truncate the graph, which is
+# visualized by representing a node as a red box. Note that if the
+# number of direct children of the root node in a graph is already larger than
+# DOT_GRAPH_MAX_NODES then the graph will not be shown at all. Also note
+# that the size of a graph can be further restricted by MAX_DOT_GRAPH_DEPTH.
+
+DOT_GRAPH_MAX_NODES = 50
+
+# The MAX_DOT_GRAPH_DEPTH tag can be used to set the maximum depth of the
+# graphs generated by dot. A depth value of 3 means that only nodes reachable
+# from the root by following a path via at most 3 edges will be shown. Nodes
+# that lie further from the root node will be omitted. Note that setting this
+# option to 1 or 2 may greatly reduce the computation time needed for large
+# code bases. Also note that the size of a graph can be further restricted by
+# DOT_GRAPH_MAX_NODES. Using a depth of 0 means no depth restriction.
+
+MAX_DOT_GRAPH_DEPTH = 0
+
+# Set the DOT_TRANSPARENT tag to YES to generate images with a transparent
+# background. This is disabled by default, because dot on Windows does not
+# seem to support this out of the box. Warning: Depending on the platform used,
+# enabling this option may lead to badly anti-aliased labels on the edges of
+# a graph (i.e. they become hard to read).
+
+DOT_TRANSPARENT = NO
+
+# Set the DOT_MULTI_TARGETS tag to YES to allow dot to generate multiple output
+# files in one run (i.e. multiple -o and -T options on the command line). This
+# makes dot run faster, but since only newer versions of dot (>1.8.10)
+# support this, this feature is disabled by default.
+
+DOT_MULTI_TARGETS = NO
+
+# If the GENERATE_LEGEND tag is set to YES (the default) Doxygen will
+# generate a legend page explaining the meaning of the various boxes and
+# arrows in the dot generated graphs.
+
+GENERATE_LEGEND = YES
+
+# If the DOT_CLEANUP tag is set to YES (the default) Doxygen will
+# remove the intermediate dot files that are used to generate
+# the various graphs.
+
+DOT_CLEANUP = YES
diff --git a/rocclr/compiler/lib/amdoclcl.def.in b/rocclr/compiler/lib/amdoclcl.def.in
new file mode 100644
index 0000000000..0d8a7009e2
--- /dev/null
+++ b/rocclr/compiler/lib/amdoclcl.def.in
@@ -0,0 +1,99 @@
+EXPORTS
+aclLoader_OnLoad
+aclLoader_OnUnload
+aclCompilerInit
+aclCompilerFini
+aclCompilerVersion
+aclVersionSize
+aclGetErrorString
+aclGetArchInfo
+aclGetDeviceInfo
+aclGetTargetInfo
+aclGetArchitecture
+aclGetFamily
+aclGetChip
+aclBinaryInit
+aclBinaryFini
+aclReadFromFile
+aclReadFromMem
+aclWriteToFile
+aclWriteToMem
+aclCreateFromBinary
+aclBinaryVersion
+aclInsertSection
+aclRemoveSection
+aclExtractSection
+aclInsertSymbol
+aclRemoveSymbol
+aclExtractSymbol
+aclDbgAddArgument
+aclDbgRemoveArgument
+aclQueryInfo
+aclCompile
+aclLink
+aclGetCompilerLog
+aclRetrieveType
+aclSetType
+aclConvertType
+aclDisassemble
+aclGetDeviceBinary
+oclCompilerInit
+oclCompilerFini
+oclCompilerVersion
+oclVersionSize
+oclCompileSource
+oclCompileSourceToIR
+oclCompileIRToIL
+oclCompileILToISA
+oclCompileBinary
+oclGetCompilerLog
+oclGetArchInfo
+oclGetFamilyInfo
+oclGetDeviceInfo
+oclGetAsicInfo
+oclGetTargetInfo
+oclGetArchitecture
+oclGetFamily
+oclGetChip
+oclGetAsic
+elfInsertSection
+elfExtractSection
+elfInsertSymbol
+elfExtractSymbol
+oclirSetType
+oclirRetrieveType
+oclirLink
+oclhsaCompileSource
+oclhsaCompileBinary
+oclhsaSetType
+oclhsaRetrieveType
+oclhsaConvertType
+oclilCompileSource
+oclilCompileBinary
+oclilSetType
+oclilRetrieveType
+oclilConvertType
+oclisaDisassemble
+oclisaGetBinaryBlob
+constructOclElf
+destructOclElf
+readOclElfFromFile
+readOclElfFromMem
+writeOclElfToFile
+writeOclElfToMem
+createElfFromElf
+getBIFVersion
+rtGetInfo
+aclDumpBinary
+aclJITObjectImageCreate
+aclJITObjectImageCopy
+aclJITObjectImageDestroy
+aclJITObjectImageFinalize
+aclJITObjectImageSize
+aclJITObjectImageData
+aclJITObjectImageDisassembleKernel
+aclJITObjectImageIterateSymbols
+aclJITObjectImageGetGlobalsSize
+#if defined(WITH_TARGET_HSAIL)
+aclHsaLoader
+#endif
diff --git a/rocclr/compiler/lib/amdoclcl.map.in b/rocclr/compiler/lib/amdoclcl.map.in
new file mode 100644
index 0000000000..f2ee10dedc
--- /dev/null
+++ b/rocclr/compiler/lib/amdoclcl.map.in
@@ -0,0 +1,104 @@
+ACL_API_0.8 {
+global:
+ oclCompilerInit;
+ oclCompilerFini;
+ oclCompilerVersion;
+ oclVersionSize;
+ oclCompileSource;
+ oclCompileSourceToIR;
+ oclCompileIRToIL;
+ oclCompileILToISA;
+ oclCompileBinary;
+ oclGetCompilerLog;
+ oclGetArchInfo;
+ oclGetDeviceInfo;
+ oclGetTargetInfo;
+ oclGetArchitecture;
+ oclGetFamily;
+ oclGetChip;
+ readOclElfFromFile;
+ readOclElfFromMem;
+ writeOclElfToFile;
+ writeOclElfToMem;
+ createElfFromElf;
+ getBIFVersion;
+ constructOclElf;
+ destructOclElf;
+ elfInsertSection;
+ elfExtractSection;
+ elfInsertSymbol;
+ elfExtractSymbol;
+ oclirSetType;
+ oclirRetrieveType;
+ oclirLink;
+ oclhsaCompileSource;
+ oclhsaCompileBinary;
+ oclhsaSetType;
+ oclhsaRetrieveType;
+ oclhsaConvertType;
+ oclilCompileSource;
+ oclilCompileBinary;
+ oclilSetType;
+ oclilRetrieveType;
+ oclilConvertType;
+ oclisaDisassemble;
+ oclisaGetBinaryBlob;
+ rtGetInfo;
+ aclCompilerInit;
+ aclCompilerFini;
+ aclCompilerVersion;
+ aclVersionSize;
+ aclGetErrorString;
+ aclGetArchInfo;
+ aclGetFamilyInfo;
+ aclGetDeviceInfo;
+ aclGetAsicInfo;
+ aclGetTargetInfo;
+ aclGetArchitecture;
+ aclGetFamily;
+ aclGetChip;
+ aclGetAsic;
+ aclBinaryInit;
+ aclBinaryFini;
+ aclReadFromFile;
+ aclReadFromMem;
+ aclWriteToFile;
+ aclWriteToMem;
+ aclCreateFromBinary;
+ aclBinaryVersion;
+ aclInsertSection;
+ aclRemoveSection;
+ aclExtractSection;
+ aclInsertSymbol;
+ aclRemoveSymbol;
+ aclExtractSymbol;
+ aclQueryInfo;
+ aclDbgAddArgument;
+ aclDbgRemoveArgument;
+ aclCompile;
+ aclLink;
+ aclGetCompilerLog;
+ aclRetrieveType;
+ aclSetType;
+ aclConvertType;
+ aclDisassemble;
+ aclGetDeviceBinary;
+ aclLoader_OnLoad;
+ aclLoader_OnUnload;
+ aclJITObjectImageCreate;
+ aclJITObjectImageCopy;
+ aclJITObjectImageDestroy;
+ aclJITObjectImageFinalize;
+ aclJITObjectImageSize;
+ aclJITObjectImageData;
+ aclJITObjectImageDisassembleKernel;
+ aclJITObjectImageIterateSymbols;
+ aclJITObjectImageGetGlobalsSize;
+#if defined(WITH_TARGET_HSAIL)
+ aclHsaLoader;
+#endif
+#if defined(OPENCL_MAINLINE)
+local:
+ *;
+#endif
+};
diff --git a/rocclr/compiler/lib/amdoclcl.rc b/rocclr/compiler/lib/amdoclcl.rc
new file mode 100644
index 0000000000..c0b14d40ed
--- /dev/null
+++ b/rocclr/compiler/lib/amdoclcl.rc
@@ -0,0 +1,75 @@
+#define STR(__macro__) #__macro__
+#define XSTR(__macro__) STR(__macro__)
+
+#if defined(_DEBUG)
+#define DEBUG_ONLY(x) x
+#else
+#define DEBUG_ONLY(x)
+#endif
+
+#define VERSION_PREFIX_MAJOR 1
+#define VERSION_PREFIX_MINOR 1
+
+
+#define APSTUDIO_READONLY_SYMBOLS
+/////////////////////////////////////////////////////////////////////////////
+//
+// Generated from the TEXTINCLUDE 2 resource.
+//
+#include "winresrc.h"
+#include "utils/versions.hpp"
+
+/////////////////////////////////////////////////////////////////////////////
+#undef APSTUDIO_READONLY_SYMBOLS
+
+/////////////////////////////////////////////////////////////////////////////
+// English (U.S.) resources
+
+#if !defined(AFX_RESOURCE_DLL) || defined(AFX_TARG_ENU)
+#ifdef _WIN32
+LANGUAGE LANG_ENGLISH, SUBLANG_ENGLISH_US
+#pragma code_page(1252)
+#endif //_WIN32
+
+
+/////////////////////////////////////////////////////////////////////////////
+//
+// Version
+//
+
+// Version resource for the compiler library DLL. The numeric and string
+// version fields are built from the AMD_COMPILER_* macros, which are
+// not defined in this file.
+VS_VERSION_INFO VERSIONINFO
+ FILEVERSION AMD_COMPILER_MAJOR_VERSION,AMD_COMPILER_MINOR_VERSION,AMD_COMPILER_BUILD_NUMBER,AMD_COMPILER_REVISION_NUMBER
+ PRODUCTVERSION AMD_COMPILER_MAJOR_VERSION,AMD_COMPILER_MINOR_VERSION,AMD_COMPILER_BUILD_NUMBER,AMD_COMPILER_REVISION_NUMBER
+ // 0x3fL is the value of VS_FFI_FILEFLAGSMASK.
+ FILEFLAGSMASK 0x3fL
+ // Debug builds set 0x1L (the value of VS_FF_DEBUG); other builds set no flags.
+#ifdef _DEBUG
+ FILEFLAGS 0x1L
+#else
+ FILEFLAGS 0x0L
+#endif
+ // 0x40004L is the value of VOS_NT_WINDOWS32.
+ FILEOS 0x40004L
+ // 0x2L is the value of VFT_DLL.
+ FILETYPE 0x2L
+ FILESUBTYPE 0x0L
+BEGIN
+ BLOCK "StringFileInfo"
+ BEGIN
+ // "040904b0": language 0x0409 with code page 0x04b0 (1200), the same
+ // pair that the "Translation" value below declares.
+ BLOCK "040904b0"
+ BEGIN
+ VALUE "Comments", " \0"
+ VALUE "CompanyName", "Advanced Micro Devices Inc.\0"
+ VALUE "FileDescription", AMD_COMPILER_NAME " OpenCL " XSTR(VERSION_PREFIX_MAJOR) "." XSTR(VERSION_PREFIX_MINOR) " Compiler\0"
+ // The version strings carry a fifth component,
+ // AMD_SC_COMPILER_REVISION_NUMBER, that the four-part numeric
+ // FILEVERSION/PRODUCTVERSION fields above do not include.
+ VALUE "FileVersion", XSTR(AMD_COMPILER_MAJOR_VERSION) ", " XSTR(AMD_COMPILER_MINOR_VERSION) ", " XSTR(AMD_COMPILER_BUILD_NUMBER) ", " XSTR(AMD_COMPILER_REVISION_NUMBER) ", " XSTR(AMD_SC_COMPILER_REVISION_NUMBER)
+ VALUE "InternalName", "AOC"
+ VALUE "LegalCopyright", "Copyright (C) 2011 Advanced Micro Devices Inc.\0"
+ VALUE "OriginalFilename", "amdoclcl.dll"
+ VALUE "ProductName", "AMD Compiler Library " XSTR(VERSION_PREFIX_MAJOR) "." XSTR(VERSION_PREFIX_MINOR) " " AMD_COMPILER_INFO "\0"
+ VALUE "ProductVersion", XSTR(AMD_COMPILER_MAJOR_VERSION) ", " XSTR(AMD_COMPILER_MINOR_VERSION) ", " XSTR(AMD_COMPILER_BUILD_NUMBER) ", " XSTR(AMD_COMPILER_REVISION_NUMBER) ", " XSTR(AMD_SC_COMPILER_REVISION_NUMBER)
+ END
+ END
+ BLOCK "VarFileInfo"
+ BEGIN
+ VALUE "Translation", 0x409, 1200
+ END
+END
+
+#endif // English (U.S.) resources
+/////////////////////////////////////////////////////////////////////////////
diff --git a/rocclr/compiler/lib/backends/common/backend.hpp b/rocclr/compiler/lib/backends/common/backend.hpp
new file mode 100644
index 0000000000..e7e9cdd3e7
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/backend.hpp
@@ -0,0 +1,33 @@
+//
+// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
+//
+#ifndef _BE_BACKEND_HPP_
+#define _BE_BACKEND_HPP_
+#include "compiler_stage.hpp"
+
+namespace amdcl
+{
+ /*! \addtogroup Compiler Library
+ *
+ * \copydoc amdcl::Backend
+ *
+ * @{
+ */
+ class Backend : public CompilerStage {
+   private:
+     // Copy construction and default construction are not supported:
+     // both are declared here and deliberately never implemented.
+     Backend(Backend&);
+     Backend();
+
+   public:
+     /*! Forwards the compiler handle, the binary and the log callback
+      *  to the CompilerStage base class.
+      */
+     Backend(aclCompiler *cl, aclBinary *elf, aclLogFunction log)
+       : CompilerStage(cl, elf, log)
+     {
+     }
+
+     virtual ~Backend()
+     {
+     }
+
+     /*! Takes the contents of a source file as a string and generates
+      *  the backend binary, which is then inserted into the elf file
+      *  at the correct location.
+      */
+     virtual int jit(const std::string &source) = 0;
+ }; // class Backend
+ /*@}*/
+}; // amdcl namespace
+#endif // _BE_BACKEND_HPP_
diff --git a/rocclr/compiler/lib/backends/common/codegen.cpp b/rocclr/compiler/lib/backends/common/codegen.cpp
new file mode 100644
index 0000000000..57a639c65a
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/codegen.cpp
@@ -0,0 +1,367 @@
+//
+// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
+//
+#include "top.hpp"
+#include "codegen.hpp"
+#include "utils/libUtils.h"
+#include "os/os.hpp"
+#include "jit/src/jit.hpp"
+#include "utils/target_mappings.h"
+#include "llvm/Support/FormattedStream.h"
+#include "llvm/Support/Host.h"
+#include "llvm/Support/raw_ostream.h"
+#include "llvm/Support/TargetSelect.h"
+#include "llvm/DataLayout.h"
+#include "llvm/Target/TargetMachine.h"
+#include "llvm/Target/TargetOptions.h"
+#include "llvm/Support/TargetRegistry.h"
+#include "llvm/Support/CommandLine.h"
+#include
+#include
+#include
+#include
+
+using namespace amdcl;
+using namespace llvm;
+
+#ifdef WITH_TARGET_HSAIL
+// The FileType option is checked by HSAILTargetMachine, but it is only
+// created in llc.exe. Create it here for the online compilation path.
+// It is registered as "filetype", defaults to object-file output, and
+// accepts "asm", "obj" and "null".
+llvm::cl::opt<TargetMachine::CodeGenFileType>
+FileType("filetype", cl::init(TargetMachine::CGFT_ObjectFile),
+    cl::values(
+        clEnumValN(TargetMachine::CGFT_AssemblyFile, "asm", ""),
+        clEnumValN(TargetMachine::CGFT_ObjectFile, "obj", ""),
+        clEnumValN(TargetMachine::CGFT_Null, "null", ""),
+        clEnumValEnd));
+#endif
+
+/*! Returns the code generator name registered for a target.
+ *
+ * The family is selected from familySet by tgtInfo.arch_id and the
+ * entry inside that family's target table by tgtInfo.chip_id. The
+ * result is what llvmCodeGen() passes to createTargetMachine().
+ *
+ * \param tgtInfo target description holding the arch and chip ids.
+ * \return the entry's codegen_name, or an empty string when the family
+ *         has no target table.
+ */
+static std::string aclGetCodegenName(const aclTargetInfo &tgtInfo)
+{
+  assert(tgtInfo.arch_id <= aclLast && "Unknown device id!");
+  const FamilyMapping &family = familySet[tgtInfo.arch_id];
+
+  // The address of a table element can never be null, so the thing that
+  // has to be tested is the table pointer itself, before it is indexed.
+  if (!family.target) return "";
+
+  assert((tgtInfo.chip_id) < family.children_size && "Unknown family id!");
+  return family.target[tgtInfo.chip_id].codegen_name;
+}
+
+
+
+/*! Lowers the code generation level when the module contains a very
+ * large function.
+ *
+ * A level of CodeGenOpt::None is returned unchanged. Otherwise, as soon
+ * as one function whose size() exceeds the threshold is found,
+ * CodeGenOpt::None is returned; if there is none, the original level is
+ * kept.
+ */
+static CodeGenOpt::Level
+AdjustCGOptLevel(Module& M, CodeGenOpt::Level OrigOLvl)
+{
+  // Function::size() values above this count as "very big".
+  const unsigned int MaxFunctionSize = 10000;
+
+  bool foundHugeFunction = false;
+  if (OrigOLvl != CodeGenOpt::None) {
+    Module::iterator Cur = M.begin();
+    Module::iterator End = M.end();
+    while (!foundHugeFunction && Cur != End) {
+      foundHugeFunction = Cur->size() > MaxFunctionSize;
+      ++Cur;
+    }
+  }
+  return foundHugeFunction ? CodeGenOpt::None : OrigOLvl;
+}
+
+/*! Runs the LLVM code generator over a module and captures the output.
+ *
+ * The LLVM target is picked from the family and chip recorded in
+ * binary->target. The feature string and TargetOptions are derived from
+ * OptionsObj. CPU targets with UseJIT set are handed to jitCodeGen();
+ * everything else is emitted through a PassManager, as an object file
+ * for HSAIL targets (when built WITH_TARGET_HSAIL) and as assembly
+ * otherwise.
+ *
+ * \param Composite  module to generate code for; its target triple is
+ *                   overwritten.
+ * \param OptionsObj compile options; must not be null.
+ * \param output     string that receives the generated code.
+ * \param binary     binary whose target field identifies the device.
+ * \return 0 on success and 1 on failure.
+ */
+int
+llvmCodeGen(
+    Module* Composite,
+    amd::option::Options *OptionsObj,
+    std::string& output,
+    aclBinary* binary)
+{
+  // Every setting below is read through OptionsObj, so reject a missing
+  // options object up front instead of dereferencing it later.
+  if (!OptionsObj) {
+    LogError("llvmCodeGen requires a valid options object");
+    return 1;
+  }
+
+  const FamilyMapping &familyMap = familySet[binary->target.arch_id];
+  const TargetMapping* targetMap = familyMap.target;
+  unsigned famID = binary->target.chip_id;
+  if (!targetMap || !targetMap[famID].supported) {
+    LogError("Device is not supported by code generator!");
+    return 1;
+  }
+
+  // Load the module to be compiled...
+  Module &mod = *Composite;
+
+  // FIXME: The triple given in this map is wrong and isn't really
+  // useful. Only need the architecture.
+  const std::string TargetTriple = std::string(familyMap.triple);
+  Triple TheTriple(TargetTriple);
+  if (TheTriple.getTriple().empty()) {
+    TheTriple.setTriple(sys::getDefaultTargetTriple());
+  }
+
+  Triple::ArchType arch = TheTriple.getArch();
+
+  bool isGPU = (arch == Triple::amdil || arch == Triple::amdil64 ||
+                arch == Triple::hsail || arch == Triple::hsail_64);
+
+  if (isGPU) {
+    TheTriple.setOS(Triple::UnknownOS);
+  } else { // CPUs
+    // FIXME: This should come from somewhere else.
+#ifdef __linux__
+    TheTriple.setOS(Triple::Linux);
+#else
+    TheTriple.setOS(Triple::MinGW32);
+#endif
+  }
+
+  TheTriple.setEnvironment(Triple::AMDOpenCL);
+  // FIXME: need to make AMDOpenCL be the same as ELF
+  if (OptionsObj->oVariables->UseJIT)
+    TheTriple.setEnvironment(Triple::ELF);
+  mod.setTargetTriple(TheTriple.getTriple());
+
+  // Allocate target machine. First, check whether the user has explicitly
+  // specified an architecture to compile for. If so we have to look it up by
+  // name, because it might be a backend that has no mapping to a target triple.
+  const Target *TheTarget = 0;
+  assert(binary->target.arch_id != aclError && "Cannot have the error device!");
+
+  std::string MArch = familyMap.architecture;
+
+#ifdef WITH_TARGET_HSAIL
+  if (MArch == "hsail" && OptionsObj->oVariables->GPU64BitIsa) {
+    MArch = std::string("hsail-64");
+  }
+#endif
+
+  for (TargetRegistry::iterator it = TargetRegistry::begin(),
+       ie = TargetRegistry::end(); it != ie; ++it) {
+    if (MArch == it->getName()) {
+      TheTarget = &*it;
+      break;
+    }
+  }
+
+  if (!TheTarget) {
+    errs() << ": ERROR: invalid target '" << MArch << "'.\n";
+    return 1;
+  }
+
+  CodeGenOpt::Level OLvl = CodeGenOpt::None;
+  switch (OptionsObj->oVariables->OptLevel) {
+    case 0: // -O0
+      OLvl = CodeGenOpt::None;
+      break;
+    case 1: // -O1
+      OLvl = CodeGenOpt::Less;
+      break;
+    default:
+      assert(!"Error with optimization level");
+      // Deliberate fall through: when the assert is compiled out, an
+      // unknown level is handled like -O2.
+    case 2: // -O2
+    case 5: // -O5(-Os)
+      OLvl = CodeGenOpt::Default;
+      break;
+    case 3: // -O3
+    case 4: // -O4
+      OLvl = CodeGenOpt::Aggressive;
+      break;
+  }
+
+  // If there is a very big function, lower the optimization level.
+  OLvl = AdjustCGOptLevel(mod, OLvl);
+
+  // Adjust the triple to match (if known), otherwise stick with the
+  // module/host triple.
+  Triple::ArchType Type = Triple::getArchTypeForLLVMName(MArch);
+  if (Type != Triple::UnknownArch)
+    TheTriple.setArch(Type);
+
+  // Package up features to be passed to target/subtarget
+  std::string FeatureStr;
+  if ((Type == Triple::amdil || Type == Triple::amdil64) &&
+      targetMap[famID].chip_options) {
+    uint64_t y = targetMap[famID].chip_options;
+    for (uint64_t x = 0; y != 0; y >>= 1, ++x) {
+      // Cleared bits 11..15 produce no feature entry at all.
+      if (!(y & 0x1) && (x >= 11 && x < 16)) {
+        continue;
+      }
+
+      // Build the mask in 64 bits: x walks a 64-bit option word, and
+      // shifting a plain int by 31 or more is undefined.
+      const uint64_t flag = uint64_t(1) << x;
+      if (flag == F_NO_ALIAS) {
+        FeatureStr += (!OptionsObj->oVariables->AssumeAlias ? '+' : '-');
+      } else if (flag == F_STACK_UAV) {
+        FeatureStr += (OptionsObj->oVariables->UseStackUAV ? '+' : '-');
+      } else if (flag == F_MACRO_CALL) {
+        FeatureStr += (OptionsObj->oVariables->UseMacroForCall ? '+' : '-');
+      } else if (flag == F_64BIT_PTR) {
+        FeatureStr += (binary->target.arch_id == aclAMDIL64) ? '+' : '-';
+      } else {
+        FeatureStr += ((y & 0x1) ? '+' : '-');
+      }
+
+      FeatureStr += GPUCodeGenFlagTable[x];
+      // y == 1 means this was the highest set bit, i.e. the last entry.
+      if (y != 0x1) {
+        FeatureStr += ',';
+      }
+    }
+  }
+
+  if (Type == Triple::amdil64) {
+    if (OptionsObj->oVariables->SmallGlobalObjects)
+      FeatureStr += ",+small-global-objects";
+  }
+
+  llvm::TargetOptions targetOptions;
+  targetOptions.NoFramePointerElim = false;
+  targetOptions.StackAlignmentOverride =
+    OptionsObj->oVariables->CPUStackAlignment;
+  // jgolds
+  //targetOptions.EnableEBB = (optimize && OptionsObj->oVariables->CGEBB);
+  //targetOptions.EnableBFO = OptionsObj->oVariables->CGBFO;
+  //targetOptions.NoExcessFPPrecision = !OptionsObj->oVariables->EnableFMA;
+
+  // Don't allow unsafe optimizations for CPU because the library
+  // contains code that is not safe. See bug 9567.
+  if (isGPU)
+    targetOptions.UnsafeFPMath = OptionsObj->oVariables->UnsafeMathOpt;
+  targetOptions.LessPreciseFPMADOption = OptionsObj->oVariables->MadEnable ||
+    OptionsObj->oVariables->EnableMAD;
+  targetOptions.NoInfsFPMath = OptionsObj->oVariables->FiniteMathOnly;
+  // Need to add a support for OptionsObj->oVariables->NoSignedZeros,
+  targetOptions.NoNaNsFPMath = OptionsObj->oVariables->FastRelaxedMath;
+
+  std::auto_ptr<TargetMachine>
+    target(TheTarget->createTargetMachine(TheTriple.getTriple(),
+          aclGetCodegenName(binary->target), FeatureStr, targetOptions,
+          WINDOWS_SWITCH(Reloc::DynamicNoPIC, Reloc::PIC_),
+          CodeModel::Default, OLvl));
+  // The target machine is dereferenced below, so a failed allocation has
+  // to be reported in every build, not only where asserts are enabled.
+  if (!target.get()) {
+    LogError("Could not allocate target machine!");
+    return 1;
+  }
+
+  // MCJIT(Jan)
+  if(!isGPU && OptionsObj->oVariables->UseJIT) {
+    TargetMachine* jittarget(TheTarget->createTargetMachine(TheTriple.getTriple(),
+          aclGetCodegenName(binary->target), FeatureStr, targetOptions,
+          WINDOWS_SWITCH(Reloc::DynamicNoPIC, Reloc::PIC_),
+          CodeModel::Default, OLvl));
+
+    std::string ErrStr = jitCodeGen(Composite, jittarget, OLvl, output);
+
+    if (!ErrStr.empty()) {
+      LogError("MCJIT failed to generate code");
+      LogError(ErrStr.c_str());
+      return 1;
+    }
+    return 0;
+  }
+
+
+  TargetMachine &Target = *target;
+
+  // Figure out where we are going to send the output...
+  // Out is created with DELETE_STREAM, so deleting Out also deletes RSOut.
+  raw_string_ostream *RSOut = new raw_string_ostream(output);
+  formatted_raw_ostream *Out = new formatted_raw_ostream(*RSOut, formatted_raw_ostream::DELETE_STREAM);
+  if (Out == 0) {
+    LogError("llvmCodeGen couldn't create an output stream");
+    return 1;
+  }
+
+  // Build up all of the passes that we want to do to the module or function or
+  // Basic Block.
+  PassManager Passes;
+
+  // Add the target data from the target machine, if it exists, or the module.
+  if (const DataLayout *TD = Target.getDataLayout())
+    Passes.add(new DataLayout(*TD));
+  else
+    Passes.add(new DataLayout(&mod));
+
+  // Override default to generate verbose assembly, if the device is not the GPU.
+  // The GPU sets this in AMDILTargetMachine.cpp.
+  if (familyMap.target == (const TargetMapping*)&X86TargetMapping ||
+#if WITH_VERSION_0_9
+      // NOTE(review): A32TargetMapping is tested twice here; the second
+      // test was presumably meant for a different mapping - confirm.
+      familyMap.target == (const TargetMapping*)&A32TargetMapping ||
+      familyMap.target == (const TargetMapping*)&A32TargetMapping ||
+#elif WITH_VERSION_0_8
+#else
+#error "The current version implementation was not implemented here."
+#endif
+      familyMap.target == (const TargetMapping*)&X64TargetMapping
+     ) {
+    Target.setAsmVerbosityDefault(true);
+  }
+
+#ifdef WITH_TARGET_HSAIL
+  if (isHSAILTarget(binary->target)) {
+    if (Target.addPassesToEmitFile(Passes, *Out, TargetMachine::CGFT_ObjectFile, true)) {
+      delete Out;
+      return 1;
+    }
+  } else
+#endif
+  {
+    // The last argument of addPassesToEmitFile is false when NDEBUG is
+    // not defined and true when it is.
+#ifndef NDEBUG
+    const bool lastEmitArg = false;
+#else
+    const bool lastEmitArg = true;
+#endif
+    if (Target.addPassesToEmitFile(Passes, *Out, TargetMachine::CGFT_AssemblyFile, lastEmitArg)) {
+      delete Out;
+      return 1;
+    }
+  }
+
+  Passes.run(mod);
+
+  delete Out;
+  return 0;
+}
+
+ // Generates code for an LLVM module through llvmCodeGen().
+ //
+ // Stores the module in llvmbinary_, enables whole-program mode for
+ // every target that is not HSAIL, and runs llvmCodeGen() with Source()
+ // as the output string. When EnableBuildTiming is set the elapsed time
+ // is appended to the compiler log; when the DUMP_CGIL dump flag is set
+ // and output was produced, the output is also written to the ".il"
+ // dump file.
+ //
+ // Returns the result of llvmCodeGen().
+ int
+CLCodeGen::codegen(llvm::Module *input)
+{
+  uint64_t time_cg = 0ULL;
+  if (Options()->oVariables->EnableBuildTiming) {
+    time_cg = amd::Os::timeNanos();
+  }
+  llvmbinary_ = input;
+  // Elf() is called directly, as in the llvmCodeGen() call below, so no
+  // cast of `this` is needed to reach the binary.
+  if (!isHSAILTarget(Elf()->target)) {
+    setWholeProgram(true);
+  }
+
+  int ret = llvmCodeGen(LLVMBinary(), Options(), Source(), Elf());
+
+  if (Options()->oVariables->EnableBuildTiming) {
+    time_cg = amd::Os::timeNanos() - time_cg;
+    std::stringstream tmp_ss;
+    tmp_ss << " LLVM CodeGen time: "
+      << time_cg/1000ULL
+      << "us\n";
+    appendLogToCL(CL(), tmp_ss.str());
+  }
+  if (!Source().empty() && Options()->isDumpFlagSet(amd::option::DUMP_CGIL)) {
+    std::string ilFileName = Options()->getDumpFileName(".il");
+    std::fstream f;
+    f.open(ilFileName.c_str(), (std::fstream::out | std::fstream::binary));
+    // The dump is best effort: nothing is written if the file could not
+    // be opened.
+    if (f.is_open()) {
+      f.write(Source().data(), Source().length());
+      f.close();
+    }
+  }
+
+  return ret;
+}
diff --git a/rocclr/compiler/lib/backends/common/codegen.hpp b/rocclr/compiler/lib/backends/common/codegen.hpp
new file mode 100644
index 0000000000..e8581e19ce
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/codegen.hpp
@@ -0,0 +1,87 @@
+//
+// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
+//
+#ifndef _BE_CODEGEN_HPP_
+#define _BE_CODEGEN_HPP_
+#include "compiler_stage.hpp"
+
+namespace amdcl
+{
+ /*! \addtogroup Compiler Library
+ *
+ * \copydoc amdcl::CodeGen
+ * @{
+ * \brief Abstract interface for stages that generate code from an LLVM module.
+ */
+ class CodeGen : public LLVMCompilerStage {
+ CodeGen(CodeGen&); // DO NOT IMPLEMENT.
+ CodeGen(); // DO NOT IMPLEMENT.
+ public:
+ CodeGen(aclCompiler *cl, aclBinary *elf, aclLogFunction log)
+ : LLVMCompilerStage(cl, elf, log) {}
+ // The constructor only forwards its three arguments to LLVMCompilerStage.
+ virtual ~CodeGen() {}
+
+ /*! Function that takes in an LLVM module as input
+ * and generates code for it based on the target
+ * device. Pure virtual: derived classes supply the implementation.
+ * Returns 0 on success and non-zero on failure.
+ */
+ virtual int codegen(llvm::Module *input) = 0;
+
+ }; // class CodeGen
+ /*@}*/
+
+ /*! \addtogroup Compiler Library
+ *
+ * \copydoc amdcl::CLCodeGen
+ * @{
+ * \brief Concrete CodeGen whose codegen() is defined in codegen.cpp.
+ */
+ class CLCodeGen : public CodeGen {
+ CLCodeGen(CLCodeGen&); // DO NOT IMPLEMENT.
+ CLCodeGen(); // DO NOT IMPLEMENT.
+ public:
+ CLCodeGen(aclCompiler *cl, aclBinary *elf, aclLogFunction log)
+ : CodeGen(cl, elf, log) {}
+ // The constructor only forwards its three arguments to CodeGen.
+ virtual ~CLCodeGen() {}
+
+ /*! Function that takes in an LLVM module as input
+ * and generates code for it based on the target
+ * device. Overrides CodeGen::codegen().
+ * Returns 0 on success and non-zero on failure.
+ */
+ virtual int codegen(llvm::Module *input);
+
+ }; // class CLCodeGen
+ /*@}*/
+
+#if 0
+ /*! \addtogroup Compiler Library
+ *
+ * \copydoc amdcl::AMDILCodeGen
+ *
+ * @{
+ */
+ class AMDILCodeGen : public CodeGen {
+ AMDILCodeGen(AMDILCodeGen&); // DO NOT IMPLEMENT.
+ AMDILCodeGen(); // DO NOT IMPLEMENT.
+ public:
+ AMDILCodeGen(aclCompiler *cl, aclBinary *elf, llvm::LLVMContext *ctx)
+ : CLCodeGen(cl, elf, ctx) {}
+
+ virtual ~AMDILCodeGen() {}
+
+ /*! Function that takes in an LLVM module as input
+ * and generates code for it based on the target
+ * device.
+ * Returns 0 on success and non-zero on failure.
+ */
+ int codegen(llvm::Module *input) = 0;
+
+ }; // class AMDILCodeGen
+ /*@}*/
+#endif
+} // amdcl namespace
+#endif // _BE_CODEGEN_HPP_
diff --git a/rocclr/compiler/lib/backends/common/compiler_stage.cpp b/rocclr/compiler/lib/backends/common/compiler_stage.cpp
new file mode 100644
index 0000000000..36a855a7cb
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/compiler_stage.cpp
@@ -0,0 +1,99 @@
+//
+// Copyright (c) 2012 Advanced Micro Devices, Inc. All rights reserved.
+//
+#include "compiler_stage.hpp"
+#include "utils/libUtils.h"
+
+using namespace amdcl;
+
+// Records the compiler, binary and log callback; options are read off the binary.
+CompilerStage::CompilerStage(aclCompiler* cl, aclBinary* elf,
+                             aclLogFunction callback)
+  : cl_(cl), elf_(elf), binary_(NULL),
+    opts_((amd::option::Options*)elf->options),
+    source_(), log_(), callback_(callback)
+{ }
+
+CompilerStage::~CompilerStage()
+{ }
+// Builds the stage and copies build options into the LLVM context hook (hookup_).
+LLVMCompilerStage::LLVMCompilerStage(aclCompiler *cl, aclBinary *elf,
+ aclLogFunction callback)
+: CompilerStage(cl, elf, callback),
+ llvmbinary_(NULL),
+ context_(NULL) // no LLVM context until setContext() is called
+{
+ if (!Options()->oVariables->DisableAllWarnings) {
+ hookup_.LLVMBuildLog = &log_; // the hook receives a pointer to this stage's build log
+ }
+ // Expose some options to LLVM.
+ llvm::AMDOptions *amdopts = &hookup_.amdoptions;
+ amdopts->OptLiveness = Options()->oVariables->OptLiveness;
+ if (isHSAILTarget(Elf()->target)) {
+ if ((amdopts->NumAvailGPRs == ~0u) || (Options()->NumAvailGPRs != -1)) // hook still ~0u, or option is not -1
+ amdopts->NumAvailGPRs = Options()->NumAvailGPRs;
+ } else {
+ amdopts->OptPrintLiveness = Options()->oVariables->OptPrintLiveness;
+ amdopts->OptMem2reg = Options()->oVariables->OptMem2reg;
+ amdopts->UseJIT = Options()->oVariables->UseJIT;
+ amdopts->APThreshold = Options()->oVariables->APThreshold;
+ amdopts->AAForBarrier = Options()->oVariables->AAForBarrier;
+ amdopts->UnrollScratchThreshold = 500; // fixed value, not read from the options
+ amdopts->AmdilUseDefaultResId = Options()->oVariables->DefaultResourceId;
+ }
+ amdopts->OptSimplifyLibCall = Options()->oVariables->OptSimplifyLibCall;
+ amdopts->EnableFDiv2FMul = Options()->oVariables->EnableFDiv2FMul;
+ amdopts->SRThreshold = Options()->oVariables->SRThreshold;
+ amdopts->OptMemCombineMaxVecGen = Options()->oVariables->OptMemCombineMaxVecGen;
+ amdopts->OptLICM = Options()->oVariables->OptLICM;
+
+ // math-related options
+ amdopts->UnsafeMathOpt = Options()->oVariables->UnsafeMathOpt;
+ amdopts->NoSignedZeros = Options()->oVariables->NoSignedZeros;
+ amdopts->FiniteMathOnly = Options()->oVariables->FiniteMathOnly;
+ amdopts->FastRelaxedMath = Options()->oVariables->FastRelaxedMath;
+ // LU* options are copied one-to-one from the option variables.
+ amdopts->LUThreshold = Options()->oVariables->LUThreshold;
+ amdopts->LUCount = Options()->oVariables->LUCount;
+ amdopts->LUAllowPartial = Options()->oVariables->LUAllowPartial;
+ amdopts->GPUArch = (uint32_t)getLibraryType(&elf->target); // library selector for the binary's target
+}
+// Stores ctx as this stage's LLVM context and, when non-null, installs hookup_ on it.
+ void
+LLVMCompilerStage::setContext(aclContext *ctx)
+{
+ context_ = reinterpret_cast(ctx); // aclContext is treated as the underlying LLVM context
+ if (ctx) {
+ Context().setAMDLLVMContextHook(&hookup_); // hookup_ is a member, so the context points into this object
+ }
+}
+// Detaches hookup_ from the context so the context does not keep a pointer into this object.
+LLVMCompilerStage::~LLVMCompilerStage()
+{
+ if (context_) { // only set once setContext() has been given a non-null context
+ Context().setAMDLLVMContextHook(NULL);
+ }
+}
+
+// Parses `llvmBinary` as LLVM bitcode, or as textual LLVM assembly when it
+// does not look like bitcode. Returns NULL when the bitcode reader fails; in
+// that case the reader's error message is appended to the build log.
+llvm::Module* LLVMCompilerStage::loadBitcode(std::string& llvmBinary)
+{
+  const unsigned char *begin =
+      reinterpret_cast<const unsigned char*>(llvmBinary.data());
+  if (!llvm::isBitcode(begin, begin + llvmBinary.length())) {
+    llvm::SMDiagnostic diags;
+    return ParseAssemblyString(llvmBinary.c_str(), llvmbinary_, diags, Context());
+  }
+  // Use getMemBuffer() ?
+  llvm::MemoryBuffer *Buffer = llvm::MemoryBuffer::getMemBufferCopy(
+      llvm::StringRef(llvmBinary), "input.bc");
+  if (!Buffer) return NULL;
+  std::string ErrorMessage;
+  llvm::Module *M = llvm::ParseBitcodeFile(Buffer, Context(), &ErrorMessage);
+  delete Buffer;
+  // Surface the reader's diagnostic instead of silently dropping it.
+  if (!M && !ErrorMessage.empty()) log_ += ErrorMessage + "\n";
+  return M;
+}
diff --git a/rocclr/compiler/lib/backends/common/compiler_stage.hpp b/rocclr/compiler/lib/backends/common/compiler_stage.hpp
new file mode 100644
index 0000000000..2d14bdde9a
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/compiler_stage.hpp
@@ -0,0 +1,96 @@
+//
+// Copyright (c) 2012 Advanced Micro Devices, Inc. All rights reserved.
+//
+#ifndef _BE_COMPILER_STAGE_HPP_
+#define _BE_COMPILER_STAGE_HPP_
+#include "aclTypes.h"
+#include "utils/options.hpp"
+#include "llvm/AMDLLVMContextHook.h"
+#include "llvm/LLVMContext.h"
+#include "llvm/Module.h"
+#include "llvm/PassManager.h"
+#include "llvm/Pass.h"
+#include "llvm/Support/MemoryBuffer.h"
+#include "llvm/Support/SourceMgr.h"
+#include "llvm/Bitcode/ReaderWriter.h"
+#include "llvm/Assembly/Parser.h"
+
+#include
+#include
+
+namespace amdcl
+{
+ /*! \addtogroup CompilerLibrary
+ *
+ * \copydoc amdcl::CompilerStage
+ * @{
+ * \brief Base class holding the state shared by the compiler stages.
+ */
+ class CompilerStage {
+ private:
+ CompilerStage(); // DO NOT IMPLEMENT.
+ CompilerStage(CompilerStage&); // DO NOT IMPLEMENT.
+ public:
+ CompilerStage(aclCompiler* cl, aclBinary* elf, aclLogFunction callback);
+
+ virtual ~CompilerStage();
+
+ /*! Returns the compiler handle given to the constructor */
+ aclCompiler* CL() const { return cl_; }
+
+ /*! Returns the elf binary given to the constructor */
+ aclBinary* Elf() const { return elf_; }
+
+ /*! Returns the log callback given to the constructor */
+ aclLogFunction Callback() const { return callback_; }
+
+ /*! Returns the options; asserts that they are not null */
+ amd::option::Options* Options() const {
+ assert(opts_ && "Options should not be null");
+ return opts_;
+ }
+
+
+ /*! Returns a mutable reference to the stage's source string */
+ std::string& Source() { return source_; }
+
+ /*! Returns a mutable reference to the build log */
+ std::string& BuildLog() { return log_; }
+
+ protected:
+ aclCompiler *cl_; // compiler handle, returned by CL()
+ aclBinary *elf_; // binary being built, returned by Elf()
+ void *binary_; // set to NULL by the constructor
+ amd::option::Options* opts_; // taken from elf->options in the constructor
+ std::string source_; // text/binary payload exposed through Source()
+ std::string log_; // build log exposed through BuildLog()
+ aclLogFunction callback_; // log callback, returned by Callback()
+ }; // class CompilerStage
+
+ class LLVMCompilerStage : public CompilerStage {
+ public:
+ LLVMCompilerStage(aclCompiler *cl, aclBinary *elf,
+ aclLogFunction callback);
+ virtual ~LLVMCompilerStage();
+ void setContext(aclContext *ctx);
+
+ /*! Returns the local context; dereferences context_, so setContext() must have run */
+ llvm::LLVMContext& Context() { return (*context_); }
+
+ /*! Loads bitcode in either text or binary format and returns
+ * an LLVM module. */
+ virtual llvm::Module* loadBitcode(std::string& llvmBinary);
+ void setGPU(bool isForGPU) { hookup_.amdoptions.IsGPU = isForGPU; }
+ void setWholeProgram(bool Val) { hookup_.amdoptions.WholeProgram = Val; }
+
+ /*! Returns the llvm binary */
+ llvm::Module* LLVMBinary() const { return llvmbinary_; }
+ aclModule* Module() const { return reinterpret_cast(llvmbinary_);}
+ protected:
+ llvm::Module *llvmbinary_; // current module; NULL after construction
+ llvm::LLVMContext *context_; // NULL until setContext() is called
+ llvm::AMDLLVMContextHook hookup_; // option/log hook installed on the context
+ }; // class LLVMCompilerStage
+ /*@}*/
+}
+#endif // _BE_COMPILER_STAGE_HPP_
diff --git a/rocclr/compiler/lib/backends/common/frontend.cpp b/rocclr/compiler/lib/backends/common/frontend.cpp
new file mode 100644
index 0000000000..a89e7802a1
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/frontend.cpp
@@ -0,0 +1,295 @@
+//
+// Copyright (c) 2011 Advanced Micro Devices, Inc. All rights reserved.
+//
+#include "top.hpp"
+#include "frontend.hpp"
+#include "bif/bifbase.hpp"
+#include "utils/libUtils.h"
+#include "utils/target_mappings.h"
+#include "utils/options.hpp"
+#include "os/os.hpp"
+#include "llvm/ADT/StringRef.h"
+#include
+#include
+#include
+#include
+#include
+#include
+// True when this library is built with 8-byte pointers.
+bool Is64bitMachine() {return sizeof(void*) == 8;}
+
+// Appends the clc "--opencl=<version> " flag selected by the -cl-std option.
+// An unrecognized value is reported in the compiler log and treated as CL1.2.
+void
+amdcl::OCLFrontend::appendCLVersionFlag(std::stringstream &ss,
+                                        const amd::option::Options *opts)
+{
+  const llvm::StringRef requested(opts->oVariables->CLStd);
+  const char *flag = NULL;
+  if (requested == "CL1.0") {
+    flag = "--opencl=1.0 ";
+  } else if (requested == "CL1.1") {
+    flag = "--opencl=1.1 ";
+  } else if (requested == "CL1.2") {
+    flag = "--opencl=1.2 ";
+  } else if (requested == "CL2.0") {
+    flag = "--opencl=2.0 ";
+  } else {
+    appendLogToCL(CL(), "Warning: invalid value for -cl-std, defaulting to CL1.2");
+    flag = "--opencl=1.2 ";
+  }
+  ss << flag;
+}
+
+/// @brief Writes @p src to @p clFile and builds the clc command line for
+/// @p elf's target. Diagnostics are directed to @p logFile (--error_output);
+/// with @p preprocessOnly, "-E -o <dump>.i" is added. Returns the command.
+///
+/// FIXME: This needs to be modified so writing to a file is
+/// not necessary!
+std::string
+amdcl::OCLFrontend::getFrontendCommand(aclBinary *elf,
+                                       const std::string &src,
+                                       std::string &logFile,
+                                       std::string &clFile,
+                                       bool preprocessOnly)
+{
+  std::stringstream systemPath;
+  std::fstream f;
+  amd::option::Options* Opts = (amd::option::Options*)elf->options;
+  // The frontend reads its input from disk, so materialize the source first.
+  f.open(clFile.c_str(), (std::fstream::out | std::fstream::binary));
+  f.write(src.data(), src.length());
+  f.close();
+
+  bool enableSpir = false;
+#ifdef DEBUG
+  enableSpir = getenv("AMD_OCL_ENABLE_SPIR") != NULL;
+#endif
+
+  if (enableSpir)
+    systemPath << "clc --spir --emit=spirbc ";
+  else
+    systemPath << "clc --emit=llvmbc ";
+
+  appendCLVersionFlag(systemPath, Opts);
+
+  if (enableSpir)
+    systemPath << "--amd-options-begin " << Opts->origOptionStr << " --amd-options-end ";
+
+#if WITH_VERSION_0_8
+  if (checkFlag(aclutGetCaps(elf), capImageSupport)) {
+    systemPath << "-D__IMAGE_SUPPORT__=1 ";
+  }
+
+  if (checkFlag(aclutGetCaps(elf), capFMA)) {
+    systemPath << "-DFP_FAST_FMAF=1 ";
+    systemPath << "-DFP_FAST_FMA=1 ";
+  }
+#elif WITH_VERSION_0_9
+#else
+#error "The current version was not handled correctly here."
+#endif
+
+  // F_IMAGES
+  if (Options()->oVariables->ImageSupport) {
+    systemPath << "-D__IMAGE_SUPPORT__=1 ";
+  }
+
+  if (Options()->oVariables->FastFMA) {
+    systemPath << "-DFP_FAST_FMA=1 ";
+  }
+
+  if (Options()->oVariables->FastFMAF) {
+    systemPath << "-DFP_FAST_FMAF=1 ";
+  }
+
+  systemPath << "-D__AMD__=1 ";
+  uint32_t chipName = elf->target.chip_id;
+  assert(chipName < familySet[elf->target.arch_id].children_size && "Cannot index past end of array!");
+  switch(elf->target.arch_id) {
+    default:
+      assert(!"Unknown target device ID!"); /* fallthrough: NDEBUG builds treat it as x86-64 */
+    case aclX64:
+      systemPath << "--march=x86-64 -D__X86_64__=1 -D__" << X64TargetMapping[chipName].chip_name << "__=1 ";
+      break;
+    case aclX86:
+      systemPath << "--march=x86 -D__X86__=1 -D__" << X86TargetMapping[chipName].chip_name << "__=1 ";
+      break;
+    case aclAMDIL:
+      systemPath << "-D__AMDIL__ -D__" << AMDILTargetMapping[chipName].chip_name << "__=1 ";
+      break;
+    case aclAMDIL64:
+      systemPath << "--march=gpu-64 -D__AMDIL_64__ -D__" << AMDIL64TargetMapping[chipName].chip_name << "__=1 ";
+      break;
+#if WITH_VERSION_0_9
+    case aclA64:
+      systemPath << "--march=arm64 -D__ARM_64__=1 -D__" << A64TargetMapping[chipName].chip_name << "__=1 ";
+      break;
+    case aclARM:
+      systemPath << "--march=arm -D__ARM__=1 -D__" << A32TargetMapping[chipName].chip_name << "__=1 ";
+      break;
+#elif WITH_VERSION_0_8
+#else
+#error "The current version was not handled correctly here."
+#endif
+    case aclHSAIL:
+      systemPath << "--march=hsail -D__HSAIL__ -D__" << HSAILTargetMapping[chipName].chip_name << "__=1 ";
+      break;
+    case aclHSAIL64:
+      systemPath << "--march=hsail-64 -D__HSAIL__ -D__" << HSAIL64TargetMapping[chipName].chip_name << "__=1 ";
+      break;
+  }
+  // AMDIL and non CPU HSAIL targets get the GPU define, everything
+  // else gets CPU define.
+  if (!isCpuTarget(elf->target)) {
+    systemPath << "-D__GPU__=1 ";
+  } else {
+    systemPath << "-D__CPU__=1 ";
+  }
+  // Trailing space keeps these flags separate from the clcOptions appended next.
+  if (elf->target.arch_id == aclAMDIL
+      && AMDILTargetMapping[chipName].family_enum == FAMILY_RV7XX) {
+    systemPath << "-Dcl_amd_vec3=1 -Dcl_amd_printf=1 --opencl=1.0 ";
+  }
+
+  if (Opts) {
+    systemPath << Opts->clcOptions;
+  }
+
+#ifdef WITH_TARGET_HSAIL
+  if ((Is64bitMachine() && isHSAILTarget(elf->target)) ||
+      (Opts->oVariables->GPU64BitIsa && (elf->target.arch_id == aclHSAIL)))
+    systemPath << " --march=hsail-64 ";
+#endif
+
+#ifdef DEBUG
+  const char* env = getenv("AMD_EDG_OPTIONS");
+  if (env)
+    systemPath << env << " ";
+#endif
+  // In DEBUG builds the environment can leave compiler output un-redirected.
+#ifdef DEBUG
+  if (!getenv("AMD_OCL_SHOW_COMPILER_OUTPUT"))
+#endif
+    systemPath << " --error_output \"" << logFile << "\" ";
+  if (preprocessOnly) {
+    std::string clppFileName = Opts->getDumpFileName(".i");
+    systemPath << " -E -o \"" << clppFileName << "\"";
+  }
+  systemPath << " \"" << clFile << "\" ";
+
+  LogPrintfDebug("Invoking CL to LLVM binary compilation:\n %s",
+                 systemPath.str().c_str());
+
+#ifdef DEBUG
+  if (getenv("AMD_OCL_SHOW_CMD_LINE"))
+    std::cout << "command line: " << systemPath.str() << std::endl;
+#endif
+  // Optional copy of the source into the dump file (skipped for the -E run).
+  if (Opts && Opts->isDumpFlagSet(amd::option::DUMP_CL) && !preprocessOnly) {
+    std::string clFileName = Opts->getDumpFileName(".cl");
+    f.open(clFileName.c_str(), (std::fstream::out | std::fstream::binary));
+    f.write(src.data(), src.length());
+    f.close();
+  }
+  std::string clcCmd = systemPath.str();
+  return clcCmd;
+}
+// CLC_IN_PROCESS_CHANGE
+extern int openclFrontEnd(const char* cmdline, std::string*, std::string* typeInfo = NULL);
+
+// Returns the text of `file`, or an empty string when the file cannot be
+// opened, is empty, or its size cannot be determined. The buffer is treated
+// as a C string, so anything after an embedded NUL byte is not returned.
+static std::string
+loadFileToStr(std::string file)
+{
+  std::string str;
+  std::ifstream log(file.c_str(), std::ios::in | std::ios::ate);
+  if (!log.is_open()) return str;
+  const std::streamoff end = log.tellg(); // opened at end, so this is the size
+  if (end <= 0) return str;               // -1 on failure, 0 for an empty file
+  const size_t size = static_cast<size_t>(end);
+  std::vector<char> buffer(size + 1, '\0'); // extra byte keeps it terminated
+  log.seekg(0, std::ios::beg);
+  log.read(&buffer[0], size);
+  str = &buffer[0];
+  return str;
+}
+// Compiles singleSrc with the in-process clc frontend, loads the result as an LLVM module; non-zero on failure.
+int
+amdcl::OCLFrontend::compileCommand(const std::string& singleSrc)
+{
+ // All temporary files share one generated base name.
+ std::string tempFileName = amd::Os::getTempFileName();
+ std::string logFile = tempFileName + ".log";
+ std::string clFile = tempFileName + ".cl";
+ std::string frontendCmd = getFrontendCommand(Elf(), singleSrc, logFile,
+ clFile, false); // also writes singleSrc to clFile
+ std::string logStr;
+ uint64_t start_time = 0, stop_time = 0;
+ amd::option::Options* Opts = (amd::option::Options*)Elf()->options;
+
+ if (Options()->oVariables->EnableBuildTiming) {
+ start_time = amd::Os::timeNanos();
+ }
+ if (
+#if WITH_VERSION_0_8
+ !checkFlag(aclutGetCaps(Elf()), capSaveSOURCE)
+#elif WITH_VERSION_0_9
+ !Options()->oVariables->BinSOURCE
+#else
+#error "The current version was not handled correctly here."
+#endif
+ ) {
+ CL()->clAPI.remSec(CL(), Elf(), aclSOURCE); // source section is removed unless saving it is enabled
+ }
+ int ret = openclFrontEnd(frontendCmd.c_str(), &Source(), NULL); // frontend output goes to Source()
+
+ // We dump the preprocessed code by invoking clc a second time after the
+ // original call, just in case something really bad happens in the original
+ // call.
+ if (Opts && Opts->isDumpFlagSet(amd::option::DUMP_I)) {
+ std::string pplogFile = tempFileName + "preprocess.log";
+ std::string ppFrontendCmd =
+ getFrontendCommand(Elf(), singleSrc, pplogFile, clFile, true);
+ (void) openclFrontEnd(ppFrontendCmd.c_str(), &Source(), NULL); // NOTE(review): also handed &Source(); confirm it cannot clobber the output loaded below
+ amd::Os::unlink(pplogFile.c_str());
+ }
+ if (Options()->oVariables->EnableBuildTiming) {
+ stop_time = amd::Os::timeNanos();
+ std::stringstream tmp_ss;
+ tmp_ss << " OpenCL FE time: "
+ << (stop_time - start_time)/1000ULL
+ << "us\n";
+ appendLogToCL(CL(), tmp_ss.str());
+ }
+ llvmbinary_ = loadBitcode(Source());
+ if (!llvmbinary_) {
+ ret |= 1; // a module that fails to load counts as a compile failure
+ }
+ if (!ret &&
+#if WITH_VERSION_0_8
+ checkFlag(aclutGetCaps(Elf()), capSaveLLVMIR)
+#elif WITH_VERSION_0_9
+ Options()->oVariables->BinLLVMIR
+#else
+#error "The current version was not handled correctly here."
+#endif
+ ) {
+ CL()->clAPI.insSec(CL(), Elf(), Source().data(),
+ Source().size(), aclLLVMIR);
+ } else {
+ CL()->clAPI.remSec(CL(), Elf(), aclLLVMIR); // on failure, or when saving LLVM IR is not enabled
+ }
+ log_ += loadFileToStr(logFile); // frontend diagnostics join the build log
+ amd::Os::unlink(logFile.c_str());
+ if (isCpuTarget(Elf()->target)
+ && Options()->oVariables->EnableDebug) {
+ Options()->sourceFileName_ = clFile; // the .cl file is kept for CPU debug builds
+ } else {
+ amd::Os::unlink(clFile.c_str());
+ }
+ return ret;
+}
diff --git a/rocclr/compiler/lib/backends/common/frontend.hpp b/rocclr/compiler/lib/backends/common/frontend.hpp
new file mode 100644
index 0000000000..0c9145f84d
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/frontend.hpp
@@ -0,0 +1,99 @@
+//
+// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
+//
+#ifndef _BE_FRONTEND_HPP_
+#define _BE_FRONTEND_HPP_
+#include
+#include "aclTypes.h"
+#include "compiler_stage.hpp"
+
+namespace amdcl
+{
+ /*! \addtogroup CompilerLibrary
+ *
+ * \copydoc amdcl::Frontend
+ *
+ * @{
+ * \brief Interface parent class for the frontend child classes.
+ * This class should never be instantiated directly.
+ */
+ class Frontend : public LLVMCompilerStage {
+ Frontend(Frontend&); // DO NOT IMPLEMENT.
+ Frontend(); // DO NOT IMPLEMENT.
+ public:
+ Frontend(aclCompiler* cl, aclBinary* elf, aclLogFunction log)
+ : LLVMCompilerStage(cl, elf, log) {}
+ //! Virtual destructor that makes sure everything is cleaned up.
+ virtual ~Frontend() {}
+
+ //! Function that converts from OpenCL singleSrc into
+ //! OpenCL formatted LLVM-IR stored as a std::string.
+ //! Pure virtual; the implementations return non-zero on failure.
+ virtual int compileCommand(const std::string& singleSrc) = 0;
+
+ }; // class Frontend
+ /*@}*/
+
+ /*! \addtogroup CompilerLibrary
+ *
+ * \copydoc amdcl::OCLFrontend
+ *
+ * @{
+ * \brief Implementation of the Frontend interface to compile
+ * from OpenCL C to LLVM-IR.
+ */
+ class OCLFrontend : public Frontend {
+ OCLFrontend(OCLFrontend&); // DO NOT IMPLEMENT.
+ OCLFrontend(); // DO NOT IMPLEMENT.
+ // Appends the "--opencl=<version> " flag chosen from opts to ss.
+ void appendCLVersionFlag(
+ std::stringstream &ss,
+ const amd::option::Options *opts);
+ // Writes src to clFile and returns the clc command line for elf's target.
+ std::string getFrontendCommand(
+ aclBinary *elf,
+ const std::string &src,
+ std::string &logFile,
+ std::string &clFile,
+ bool preprocessOnly);
+
+ public:
+ OCLFrontend(aclCompiler* cl, aclBinary* elf, aclLogFunction log)
+ : Frontend(cl, elf, log) {}
+
+ virtual ~OCLFrontend() {}
+
+ //! Function that converts from OpenCL singleSrc into
+ //! OpenCL formatted LLVM-IR stored as a std::string.
+ //! This function generates a command string for clc to execute.
+ virtual int compileCommand(const std::string& singleSrc);
+
+ }; // class OCLFrontend
+ /*@}*/
+
+
+ /*! \addtogroup CompilerLibrary
+ *
+ * \copydoc amdcl::ClangOCLFrontend
+ *
+ * @{
+ * \brief This is the class which calls the clang front-end.
+ * This class will be used if the user asks for it (by default EDG will be
+ * called).
+ */
+ class ClangOCLFrontend : public Frontend {
+ //! Options to be passed to the ClangOCLFE library.
+
+ public:
+ ClangOCLFrontend(aclCompiler* cl, aclBinary* elf, aclLogFunction log);
+
+ //! Virtual destructor that makes sure everything is cleaned up.
+ virtual ~ClangOCLFrontend() {}
+
+ //! Compiles singleSrc through the ClangOCLFE library.
+ virtual int compileCommand(const std::string& singleSrc);
+
+ }; // class ClangOCLFrontend
+ /*@}*/
+} // namespace amdcl
+#endif // _BE_FRONTEND_HPP_
diff --git a/rocclr/compiler/lib/backends/common/frontend_clang.cpp b/rocclr/compiler/lib/backends/common/frontend_clang.cpp
new file mode 100644
index 0000000000..e7ae76e70e
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/frontend_clang.cpp
@@ -0,0 +1,202 @@
+//
+// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
+//
+
+#include "OpenCLFE.h"
+
+#include "bif/bifbase.hpp"
+#include "frontend.hpp"
+#include "os/os.hpp"
+#include "top.hpp"
+#include "utils/libUtils.h"
+#include "utils/options.hpp"
+#include "utils/target_mappings.h"
+
+#include "llvm/Support/ErrorHandling.h"
+#include "llvm/Support/MemoryBuffer.h"
+#include "llvm/ADT/StringRef.h"
+
+#include
+#include
+#include
+
+amdcl::ClangOCLFrontend::ClangOCLFrontend(aclCompiler* cl,
+                                          aclBinary* elf, aclLogFunction log)
+  : Frontend(cl, elf, log) { /* all state lives in the base classes */ }
+
+/// @brief Compiles @p src through the ClangOCLFE library and loads the result
+/// as an LLVM module. Returns 0 on success and non-zero on failure.
+int amdcl::ClangOCLFrontend::compileCommand(const std::string& src) {
+ // Errors are reported by appending to log_ and returning non-zero.
+ std::vector argsToClang;
+ std::string tempFileName = amd::Os::getTempFileName();
+ std::string logFileName = tempFileName + ".log"; // NOTE(review): not referenced again in this function
+ std::string inpCLFileName = tempFileName + ".cl";
+ std::string logFromClang;
+ int ret = 0;
+
+ aclBinary *elf = Elf();
+ amd::option::Options* amdOpts = (amd::option::Options*)elf->options;
+
+ // Following are the options passed to the ClangOCLFE library
+ // and then to Clang itself.
+
+ // Passing the compiler FE options to clang.
+ if (amdOpts) {
+ for (std::vector::const_iterator it = amdOpts->clangOptions.begin();
+ it != amdOpts->clangOptions.end(); ++it) {
+ argsToClang.push_back((*it).c_str());
+ }
+ }
+
+ // Other options are passed using OptionsInfo structure.
+ clc2::OptionsInfo ClangOptions;
+
+ ClangOptions.InFilename = inpCLFileName;
+
+ // Generate target triple.
+ // TODO: Refine the triple as necessary.
+ uint32_t chipName = elf->target.chip_id;
+ assert(chipName < familySet[elf->target.arch_id].children_size &&
+ "Cannot index past end of array!");
+ switch (elf->target.arch_id) {
+ default:
+ log_ += "\nerror: Unknown target device ID!\n";
+ ret |= 1;
+ return ret;
+ break;
+ case aclX86:
+ case aclAMDIL:
+ case aclHSAIL:
+ // See bug: http://ocltc.amd.com/bugs/show_bug.cgi?id=9631
+ if (sizeof(void*) != 4) {
+ log_ += "\nerror: 32-bit kernels not supported on a 64-bit executable\n";
+ ret |= 1;
+ return ret;
+ }
+ ClangOptions.TargetArch = llvm::Triple::spir;
+ break;
+ case aclX64:
+ case aclAMDIL64:
+ case aclHSAIL64:
+ // See bug: http://ocltc.amd.com/bugs/show_bug.cgi?id=9631
+ if (sizeof(void*) != 8) {
+ log_ += "\nerror: 64-bit kernels not supported on a 32-bit executable\n";
+ ret |= 1;
+ return ret;
+ }
+ ClangOptions.TargetArch = llvm::Triple::spir64;
+ break;
+ };
+
+ // Copy the source to a buffer. Note that the input
+ // file itself is not passed to the ClangOCLFE library. It is passed
+ // as a string for compilation.
+
+ llvm::MemoryBuffer *srcBuffer =
+ llvm::MemoryBuffer::getMemBuffer(src, inpCLFileName.c_str(),
+ true);
+ llvm::OwningPtr srcBufferPtr(srcBuffer);
+ ClangOptions.Src.swap(srcBufferPtr); // ClangOptions.Src now holds the buffer
+ assert(ClangOptions.Src.get() && "ClangOCLFE: Memory Buffer"
+ " initialization error\n");
+
+ // Set Pre-processor output if user asks for it.
+ if (amdOpts && amdOpts->isDumpFlagSet(amd::option::DUMP_I)) {
+ ClangOptions.PreProcOut = amdOpts->getDumpFileName(".i");
+ }
+
+ // Set the LLVMContext for the front-end compilation.
+ ClangOptions.CompilerContext = &Context();
+
+ if (amdOpts && amdOpts->isDumpFlagSet(amd::option::DUMP_CL)) {
+ std::string inpCLFileName = amdOpts->getDumpFileName(".cl"); // shadows the outer inpCLFileName
+ std::fstream f;
+ f.open(inpCLFileName.c_str(), (std::fstream::out | std::fstream::binary));
+ f.write(src.data(), src.length());
+ f.close();
+ }
+
+ //Start the compilation
+ uint64_t start_time = 0, stop_time = 0;
+
+ if (Options()->oVariables->EnableBuildTiming) {
+ start_time = amd::Os::timeNanos();
+ }
+
+ if (
+#if WITH_VERSION_0_8
+ !checkFlag(aclutGetCaps(Elf()), capSaveSOURCE)
+#elif WITH_VERSION_0_9
+ !Options()->oVariables->BinSOURCE
+#else
+#error "The current version was not handled correctly here."
+#endif
+ ) {
+ CL()->clAPI.remSec(CL(), Elf(), aclSOURCE); // source section is removed unless saving it is enabled
+ }
+
+ // Pass OpenCL version option to Clang
+ llvm::StringRef OCLVer(amdOpts->oVariables->CLStd); // NOTE(review): amdOpts is dereferenced here without the null check used above
+ if (OCLVer.equals("CL1.2")) {
+ ClangOptions.OCLVer = clc2::OCL_12;
+ } else if (OCLVer.equals("CL2.0")) {
+ ClangOptions.OCLVer = clc2::OCL_20;
+ } else {
+ llvm_unreachable("Unknown OpenCL version"); // NOTE(review): reached for any other -cl-std value (e.g. CL1.0/CL1.1)
+ }
+
+ // Call the Clang Front-end to generate serialized llvm::Module
+ // from the OpenCL source.
+#ifdef ANDROID
+ // We will not exercise Clang for RenderScript.
+ log_ += "\nerror: Clang front-end compilation unsupported on Android!\n";
+ ret |= 1;
+ return ret;
+#else
+ if (!parseOCLSource(ClangOptions, argsToClang, &Source(), &logFromClang)) {
+ log_ += logFromClang;
+ log_ += "\nerror: Clang front-end compilation failed!\n";
+ ret |= 1;
+ return ret;
+ }
+#endif
+
+ if (Options()->oVariables->EnableBuildTiming) {
+ stop_time = amd::Os::timeNanos();
+ std::stringstream tmp_ss;
+ tmp_ss << " OpenCL FE time: "
+ << (stop_time - start_time)/1000ULL
+ << "us\n";
+ appendLogToCL(CL(), tmp_ss.str());
+ }
+
+ llvmbinary_ = loadBitcode(Source());
+
+ if (!llvmbinary_) {
+ ret |= 1; // a module that fails to load counts as a compile failure
+ }
+
+ if (!ret &&
+#if WITH_VERSION_0_8
+ checkFlag(aclutGetCaps(Elf()), capSaveLLVMIR)
+#elif WITH_VERSION_0_9
+ Options()->oVariables->BinLLVMIR
+#else
+#error "The current version was not handled correctly here."
+#endif
+ ) {
+ CL()->clAPI.insSec(CL(), Elf(), Source().data(),
+ Source().size(), aclLLVMIR);
+ } else {
+ CL()->clAPI.remSec(CL(), Elf(), aclLLVMIR); // on failure, or when saving LLVM IR is not enabled
+ }
+ log_ += logFromClang;
+ if (isCpuTarget(Elf()->target)
+ && Options()->oVariables->EnableDebug) {
+ Options()->sourceFileName_ = inpCLFileName;
+ } else {
+ amd::Os::unlink(inpCLFileName.c_str()); // NOTE(review): this function never writes that file; confirm getTempFileName() creates it
+ }
+ return ret;
+}
diff --git a/rocclr/compiler/lib/backends/common/if_acl.h b/rocclr/compiler/lib/backends/common/if_acl.h
new file mode 100644
index 0000000000..e688dc880b
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/if_acl.h
@@ -0,0 +1,15 @@
+//
+// Copyright (c) 2012 Advanced Micro Devices, Inc. All rights reserved.
+//
+#ifndef _IF_ACL_H_
+#define _IF_ACL_H_
+#include "aclTypes.h"
+#if WITH_VERSION_0_8
+#include "v0_8/if_acl.h"
+#elif WITH_VERSION_0_9
+#include "v0_9/if_acl.h"
+#else
+#error "The compiler library version was not defined."
+#include "v0_8/if_acl.h"
+#endif
+#endif // _IF_ACL_H_
diff --git a/rocclr/compiler/lib/backends/common/library.cpp b/rocclr/compiler/lib/backends/common/library.cpp
new file mode 100644
index 0000000000..471bdbf3f7
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/library.cpp
@@ -0,0 +1,290 @@
+
+// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
+//
+
+#include
+#include
+
+#include "top.hpp"
+#include "aclTypes.h"
+#include "library.hpp"
+#include "utils/options.hpp"
+
+namespace amd {
+
+/*
+ Integrated bitcode libraries
+ */
+
+// GPU libraries
+#if defined(WITH_TARGET_AMDIL)
+#include "builtins-gpugen-comm.inc"
+#include "builtins-gpugen-diff.gpu.inc"
+#include "builtins-gpugen-diff.gpu-64.inc"
+#include "builtins-gpucommon-comm.inc"
+#include "builtins-gpucommon-diff.gpu.inc"
+#include "builtins-gpucommon-diff.gpu-64.inc"
+#include "builtins-SI-comm.inc"
+#include "builtins-SI-diff.gpu.inc"
+#include "builtins-SI-diff.gpu-64.inc"
+#include "builtins-CI-comm.inc"
+#include "builtins-CI-diff.gpu.inc"
+#include "builtins-CI-diff.gpu-64.inc"
+#endif // WITH_TARGET_AMDIL
+
+// CPU libraries
+#if defined(WITH_TARGET_X86)
+#include "builtins-cpugen.x86.inc"
+#include "builtins-cpucommon.x86.inc"
+#include "builtins-avx.x86.inc"
+#include "builtins-fma4.x86.inc"
+#include "builtins-cpugen.x86-64.inc"
+#include "builtins-cpucommon.x86-64.inc"
+#include "builtins-avx.x86-64.inc"
+#include "builtins-fma4.x86-64.inc"
+#endif // WITH_TARGET_X86
+
+#if defined(WITH_TARGET_ARM)
+#include "builtins-cpugen.arm.inc"
+#include "builtins-cpucommon.arm.inc"
+#endif // WITH_TARGET_ARM
+
+#ifdef WITH_TARGET_HSAIL
+// HSAIL libraries
+#include "builtins-hsail.inc"
+#include "builtins-hsail-amd-ci.inc"
+#include "builtins-gcn.inc"
+#endif
+
+#include
+// getLibDescs() : returns a list of libraries that need to be linked with the
+// application. The max number of libraries is defined by
+// enum MAX_NUM_LIBRARY_DESCS in class LibraryDescriptor.
+//
+// Return 0: successful
+// : error happened
+int
+getLibDescs (
+ LibrarySelector LibType, // input
+ LibraryDescriptor* LibDesc, // output
+ int& LibDescSize // output -- LibDesc[0:LibDescSize-1]
+)
+{
+ switch (LibType) {
+#if defined(WITH_TARGET_AMDIL)
+ case GPU_Library_Evergreen:
+ // Library order is important!
+ LibDesc[0].start = reinterpret_cast
+ (builtins_gpucommon_comm);
+ LibDesc[0].size = builtins_gpucommon_comm_size;
+ LibDesc[1].start = reinterpret_cast
+ (builtins_gpucommon_diff_gpu);
+ LibDesc[1].size = builtins_gpucommon_diff_gpu_size;
+ LibDesc[2].start = reinterpret_cast
+ (builtins_gpugen_comm);
+ LibDesc[2].size = builtins_gpugen_comm_size;
+ LibDesc[3].start = reinterpret_cast
+ (builtins_gpugen_diff_gpu);
+ LibDesc[3].size = builtins_gpugen_diff_gpu_size;
+ LibDescSize = 4;
+ break;
+
+ case GPU_Library_SI:
+ // Library order is important!
+ LibDesc[0].start = reinterpret_cast
+ (builtins_SI_comm);
+ LibDesc[0].size = builtins_SI_comm_size;
+ LibDesc[1].start = reinterpret_cast
+ (builtins_SI_diff_gpu);
+ LibDesc[1].size = builtins_SI_diff_gpu_size;
+ LibDesc[2].start = reinterpret_cast
+ (builtins_gpucommon_comm);
+ LibDesc[2].size = builtins_gpucommon_comm_size;
+ LibDesc[3].start = reinterpret_cast
+ (builtins_gpucommon_diff_gpu);
+ LibDesc[3].size = builtins_gpucommon_diff_gpu_size;
+ LibDesc[4].start = reinterpret_cast
+ (builtins_gpugen_comm);
+ LibDesc[4].size = builtins_gpugen_comm_size;
+ LibDesc[5].start = reinterpret_cast
+ (builtins_gpugen_diff_gpu);
+ LibDesc[5].size = builtins_gpugen_diff_gpu_size;
+ LibDescSize = 6;
+ break;
+
+ case GPU64_Library_SI:
+ // Library order is important!
+ LibDesc[0].start = reinterpret_cast
+ (builtins_SI_comm);
+ LibDesc[0].size = builtins_SI_comm_size;
+ LibDesc[1].start = reinterpret_cast
+ (builtins_SI_diff_gpu_64);
+ LibDesc[1].size = builtins_SI_diff_gpu_64_size;
+ LibDesc[2].start = reinterpret_cast
+ (builtins_gpucommon_comm);
+ LibDesc[2].size = builtins_gpucommon_comm_size;
+ LibDesc[3].start = reinterpret_cast
+ (builtins_gpucommon_diff_gpu_64);
+ LibDesc[3].size = builtins_gpucommon_diff_gpu_64_size;
+ LibDesc[4].start = reinterpret_cast
+ (builtins_gpugen_comm);
+ LibDesc[4].size = builtins_gpugen_comm_size;
+ LibDesc[5].start = reinterpret_cast
+ (builtins_gpugen_diff_gpu_64);
+ LibDesc[5].size = builtins_gpugen_diff_gpu_64_size;
+ LibDescSize = 6;
+ break;
+
+ case GPU_Library_CI:
+ // Library order is important!
+ LibDesc[0].start = reinterpret_cast
+ (builtins_CI_comm);
+ LibDesc[0].size = builtins_CI_comm_size;
+ LibDesc[1].start = reinterpret_cast
+ (builtins_CI_diff_gpu);
+ LibDesc[1].size = builtins_CI_diff_gpu_size;
+ LibDesc[2].start = reinterpret_cast
+ (builtins_SI_comm);
+ LibDesc[2].size = builtins_SI_comm_size;
+ LibDesc[3].start = reinterpret_cast
+ (builtins_SI_diff_gpu);
+ LibDesc[3].size = builtins_SI_diff_gpu_size;
+ LibDesc[4].start = reinterpret_cast
+ (builtins_gpucommon_comm);
+ LibDesc[4].size = builtins_gpucommon_comm_size;
+ LibDesc[5].start = reinterpret_cast
+ (builtins_gpucommon_diff_gpu);
+ LibDesc[5].size = builtins_gpucommon_diff_gpu_size;
+ LibDesc[6].start = reinterpret_cast
+ (builtins_gpugen_comm);
+ LibDesc[6].size = builtins_gpugen_comm_size;
+ LibDesc[7].start = reinterpret_cast
+ (builtins_gpugen_diff_gpu);
+ LibDesc[7].size = builtins_gpugen_diff_gpu_size;
+ LibDescSize = 8;
+ break;
+
+ case GPU64_Library_CI:
+ // Library order is important!
+ LibDesc[0].start = reinterpret_cast
+ (builtins_CI_comm);
+ LibDesc[0].size = builtins_CI_comm_size;
+ LibDesc[1].start = reinterpret_cast
+ (builtins_CI_diff_gpu_64);
+ LibDesc[1].size = builtins_CI_diff_gpu_64_size;
+ LibDesc[2].start = reinterpret_cast
+ (builtins_SI_comm);
+ LibDesc[2].size = builtins_SI_comm_size;
+ LibDesc[3].start = reinterpret_cast
+ (builtins_SI_diff_gpu_64);
+ LibDesc[3].size = builtins_SI_diff_gpu_64_size;
+ LibDesc[4].start = reinterpret_cast
+ (builtins_gpucommon_comm);
+ LibDesc[4].size = builtins_gpucommon_comm_size;
+ LibDesc[5].start = reinterpret_cast
+ (builtins_gpucommon_diff_gpu_64);
+ LibDesc[5].size = builtins_gpucommon_diff_gpu_64_size;
+ LibDesc[6].start = reinterpret_cast
+ (builtins_gpugen_comm);
+ LibDesc[6].size = builtins_gpugen_comm_size;
+ LibDesc[7].start = reinterpret_cast
+ (builtins_gpugen_diff_gpu_64);
+ LibDesc[7].size = builtins_gpugen_diff_gpu_64_size;
+ LibDescSize = 8;
+ break;
+
+#endif // WITH_TARGET_AMDIL
+
+#if defined(WITH_TARGET_X86)
+ case CPU64_Library_Generic:
+ LibDesc[0].start = reinterpret_cast(builtins_cpucommon_x86_64);
+ LibDesc[0].size = builtins_cpucommon_x86_64_size;
+ LibDesc[1].start = reinterpret_cast(builtins_cpugen_x86_64);
+ LibDesc[1].size = builtins_cpugen_x86_64_size;
+ LibDescSize = 2;
+ break;
+
+ case CPU64_Library_AVX:
+ LibDesc[0].start = reinterpret_cast(builtins_avx_x86_64);
+ LibDesc[0].size = builtins_avx_x86_64_size;
+ LibDesc[1].start = reinterpret_cast(builtins_cpucommon_x86_64);
+ LibDesc[1].size = builtins_cpucommon_x86_64_size;
+ LibDesc[2].start = reinterpret_cast(builtins_cpugen_x86_64);
+ LibDesc[2].size = builtins_cpugen_x86_64_size;
+ LibDescSize = 3;
+ break;
+
+ case CPU64_Library_FMA4:
+ LibDesc[0].start = reinterpret_cast(builtins_fma4_x86_64);
+ LibDesc[0].size = builtins_fma4_x86_64_size;
+ LibDesc[1].start = reinterpret_cast(builtins_avx_x86_64);
+ LibDesc[1].size = builtins_avx_x86_64_size;
+ LibDesc[2].start = reinterpret_cast(builtins_cpucommon_x86_64);
+ LibDesc[2].size = builtins_cpucommon_x86_64_size;
+ LibDesc[3].start = reinterpret_cast(builtins_cpugen_x86_64);
+ LibDesc[3].size = builtins_cpugen_x86_64_size;
+ LibDescSize = 4;
+ break;
+
+ case CPU_Library_Generic:
+ LibDesc[0].start = reinterpret_cast(builtins_cpucommon_x86);
+ LibDesc[0].size = builtins_cpucommon_x86_size;
+ LibDesc[1].start = reinterpret_cast(builtins_cpugen_x86);
+ LibDesc[1].size = builtins_cpugen_x86_size;
+ LibDescSize = 2;
+ break;
+
+ case CPU_Library_AVX:
+ LibDesc[0].start = reinterpret_cast(builtins_avx_x86);
+ LibDesc[0].size = builtins_avx_x86_size;
+ LibDesc[1].start = reinterpret_cast(builtins_cpucommon_x86);
+ LibDesc[1].size = builtins_cpucommon_x86_size;
+ LibDesc[2].start = reinterpret_cast(builtins_cpugen_x86);
+ LibDesc[2].size = builtins_cpugen_x86_size;
+ LibDescSize = 3;
+ break;
+
+ case CPU_Library_FMA4:
+ LibDesc[0].start = reinterpret_cast(builtins_fma4_x86);
+ LibDesc[0].size = builtins_fma4_x86_size;
+ LibDesc[1].start = reinterpret_cast(builtins_avx_x86);
+ LibDesc[1].size = builtins_avx_x86_size;
+ LibDesc[2].start = reinterpret_cast(builtins_cpucommon_x86);
+ LibDesc[2].size = builtins_cpucommon_x86_size;
+ LibDesc[3].start = reinterpret_cast(builtins_cpugen_x86);
+ LibDesc[3].size = builtins_cpugen_x86_size;
+ LibDescSize = 4;
+ break;
+#endif // WITH_TARGET_X86
+
+#if defined(WITH_TARGET_ARM)
+ case CPU_Library_Generic:
+ LibDesc[0].start = reinterpret_cast(builtins_cpucommon_arm);
+ LibDesc[0].size = builtins_cpucommon_arm_size;
+ LibDesc[1].start = reinterpret_cast(builtins_cpugen_arm);
+ LibDesc[1].size = builtins_cpugen_arm_size;
+ LibDescSize = 2;
+ break;
+#endif // WITH_TARGET_ARM
+
+#if defined(WITH_TARGET_HSAIL)
+ case GPU_Library_HSAIL:
+ // Library order is important!
+ LibDesc[0].start = reinterpret_cast(builtins_gcn);
+ LibDesc[0].size = builtins_gcn_size;
+ LibDesc[1].start = reinterpret_cast(builtins_hsail_amd_ci);
+ LibDesc[1].size = builtins_hsail_amd_ci_size;
+ LibDesc[2].start = reinterpret_cast(builtins_hsail);
+ LibDesc[2].size = builtins_hsail_size;
+ LibDescSize = 3;
+ break;
+#endif // WITH_TARGET_HSAIL
+
+ default:
+ // Failed
+ return 1; //
+ }
+ return 0;
+}
+
+} // namespace amd
diff --git a/rocclr/compiler/lib/backends/common/library.hpp b/rocclr/compiler/lib/backends/common/library.hpp
new file mode 100644
index 0000000000..2d563a81f4
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/library.hpp
@@ -0,0 +1,59 @@
+//
+// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
+//
+
+#ifndef LIBRARY_H_
+#define LIBRARY_H_
+
+#include
+#include
+namespace amd {
+
+typedef enum _library_selector_0_7 { // selects which set of builtin libraries getLibDescs() describes
+ LibraryUndefined = 0,
+ GPU_Library_7xx,
+ GPU_Library_Evergreen,
+ GPU_Library_SI,
+ CPU_Library_Generic, // cpucommon + cpugen; x86 or arm images depending on WITH_TARGET_X86 / WITH_TARGET_ARM
+ CPU_Library_AVX, // avx_x86, then cpucommon_x86 and cpugen_x86
+ CPU_Library_FMA4, // fma4_x86, then avx_x86, cpucommon_x86 and cpugen_x86
+ GPU_Library_Generic,
+ CPU64_Library_Generic, // cpucommon_x86_64 + cpugen_x86_64
+ CPU64_Library_AVX, // avx_x86_64, then cpucommon_x86_64 and cpugen_x86_64
+ CPU64_Library_FMA4, // fma4_x86_64, then avx_x86_64, cpucommon_x86_64 and cpugen_x86_64
+ GPU64_Library_Evergreen,
+ GPU64_Library_SI, // SI, gpucommon and gpugen images (comm + diff_gpu_64 of each)
+ GPU64_Library_Generic,
+ GPU_Library_CI, // CI, SI, gpucommon and gpugen images (comm + diff_gpu of each)
+ GPU64_Library_CI, // CI, SI, gpucommon and gpugen images (comm + diff_gpu_64 of each)
+ GPU_Library_HSAIL, // gcn, hsail_amd_ci and hsail images (WITH_TARGET_HSAIL builds)
+ LibraryTotal // last enumerator, so its value equals the number of enumerators above it (LibraryUndefined included)
+} LibrarySelector;
+
+/** Describes one integrated bitcode library as a start pointer plus a size. **/
+class LibraryDescriptor {
+public:
+ enum {MAX_NUM_LIBRARY_DESCS = 11}; // NOTE(review): presumably the capacity callers reserve for the LibDesc array given to getLibDescs -- confirm
+
+ const char* start; // beginning of the library image; getLibDescs sets it from a builtins_* symbol
+ size_t size; // size of that image, taken from the matching builtins_*_size value (presumably bytes -- confirm)
+};
+
+int getLibDescs ( // returns 0 on success; the default (unhandled selector) path returns 1
+ LibrarySelector LibType, // input: which library set to describe; the available cases depend on WITH_TARGET_* macros
+ LibraryDescriptor* LibDesc, // output: filled from index 0; the implementation notes that library order is important
+ int& LibDescSize // output: number of entries written -- LibDesc[0:LibDescSize-1]
+);
+
+static const char* amdRTFuns[] = { // table of __amdrt_* function names; file-static, so every translation unit including this header gets its own copy
+ "__amdrt_div_i64",
+ "__amdrt_div_u64",
+ "__amdrt_mod_i64",
+ "__amdrt_mod_u64",
+ "__amdrt_cvt_f64_to_u64",
+ "__amdrt_cvt_f32_to_u64"
+}; // NOTE(review): presumably runtime helper routines that the linker handles by name -- confirm against the users of this table
+} //amd
+
+#endif // LIBRARY_H_
+
diff --git a/rocclr/compiler/lib/backends/common/linker.cpp b/rocclr/compiler/lib/backends/common/linker.cpp
new file mode 100644
index 0000000000..f85e366a47
--- /dev/null
+++ b/rocclr/compiler/lib/backends/common/linker.cpp
@@ -0,0 +1,1299 @@
+//
+// Copyright (c) 2008 Advanced Micro Devices, Inc. All rights reserved.
+//
+// TODO: The entire linker implementation should be a pass in LLVM and
+// the code in the compiler library should only call this pass.
+
+#include "top.hpp"
+#include "library.hpp"
+#include "linker.hpp"
+#include "os/os.hpp"
+#include "thread/monitor.hpp"
+#include "utils/libUtils.h"
+#include "utils/options.hpp"
+#include "utils/target_mappings.h"
+
+#include "acl.h"
+
+#include "llvm/Instructions.h"
+#include "llvm/Linker.h"
+#include "llvm/GlobalValue.h"
+#include "llvm/GlobalVariable.h"
+
+#include "llvm/AMDResolveLinker.h"
+#include "llvm/AMDPrelinkOpt.h"
+#include "llvm/ADT/Triple.h"
+#include "llvm/ADT/StringMap.h"
+#include "llvm/Analysis/AMDLocalArrayUsage.h"
+#include "llvm/Analysis/CodeMetrics.h"
+#include "llvm/Analysis/LoopPass.h"
+#include "llvm/Analysis/Passes.h"
+#include "llvm/Analysis/Verifier.h"
+#include "llvm/Bitcode/ReaderWriter.h"
+
+#include "llvm/CodeGen/LinkAllAsmWriterComponents.h"
+#include "llvm/CodeGen/LinkAllCodegenComponents.h"
+#if 1 || LLVM_TRUNK_INTEGRATION_CL >= 2270
+#else
+#include "llvm/CodeGen/ObjectCodeEmitter.h"
+#endif
+#include "llvm/Config/config.h"
+
+#include "llvm/MC/SubtargetFeature.h"
+
+#include "llvm/Support/CallSite.h"
+#include "llvm/Support/FileSystem.h"
+#include "llvm/Support/FileUtilities.h"
+#include "llvm/Support/FormattedStream.h"
+#include "llvm/Support/Host.h"
+#include "llvm/Support/ManagedStatic.h"
+#include "llvm/Support/MemoryBuffer.h"
+#include "llvm/Support/Path.h"
+#include "llvm/Support/PluginLoader.h"
+#include "llvm/Support/raw_ostream.h"
+#include "llvm/Support/Signals.h"
+#include "llvm/Support/system_error.h"
+#include "llvm/Support/TargetRegistry.h"
+#include "llvm/Support/TargetSelect.h"
+#include "llvm/DataLayout.h"
+#include "llvm/Target/TargetMachine.h"
+#include "llvm/Target/TargetOptions.h"
+
+#include "llvm/Transforms/IPO.h"
+#include "llvm/Transforms/Scalar.h"
+#include "llvm/ValueSymbolTable.h"
+
+#ifdef _DEBUG
+#include "llvm/Assembly/Writer.h"
+#endif
+
+// Undefine any existing DEBUG macro before including llvm/Support/Debug.h, which uses its own DEBUG macro.
+#ifdef DEBUG
+#undef DEBUG
+#endif
+#include "llvm/Support/Debug.h"
+
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include