Files
rocm-systems/rocclr/runtime/device/blitcl.cpp
T
foreman e682abb47e P4 to Git Change 1303140 by lmoriche@lmoriche_opencl_dev on 2016/08/15 17:04:37
SWDEV-94610 - Code provided by Wilkin - Implement the roc Program Manager to call the Lightning Compiler instead of the compiler library.
	- Embed and use the pre-compiled header generated by the built-in library build
	- If LLVM_BIN is not set, try to find Clang from the libamdocl path

	Testing: http://ocltc.amd.com:8111/viewModification.html?modId=75068&personal=true&buildTypeId=&tab=vcsModificationBuilds&show_all_builds=true

Affected files ...

... //depot/stg/opencl/drivers/opencl/compiler/lib/loaders/elf/elf.cpp#35 edit
... //depot/stg/opencl/drivers/opencl/compiler/lib/loaders/elf/elf.hpp#24 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/blitcl.cpp#9 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/device.cpp#200 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/build/Makefile.oclrocm#7 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/roccompiler.cpp#5 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocdevice.cpp#7 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rockernel.cpp#5 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rockernel.hpp#4 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocmetadata.cpp#1 add
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocmetadata.hpp#1 add
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprogram.cpp#7 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocprogram.hpp#5 edit
... //depot/stg/opencl/drivers/opencl/runtime/device/rocm/rocvirtual.cpp#8 edit
... //depot/stg/opencl/drivers/opencl/runtime/platform/program.cpp#81 edit
2016-08-15 18:51:49 -04:00

171 rivejä
3.9 KiB
C++

//
// Copyright (c) 2010 Advanced Micro Devices, Inc. All rights reserved.
//
namespace device {
#define BLIT_KERNELS(...) #__VA_ARGS__
const char* BlitSourceCode =
BLIT_KERNELS(
extern void __amd_copyBufferRect(
__global uchar*, __global uchar*,
ulong4, ulong4, ulong4);
extern void __amd_copyBufferRectAligned(
__global uint*, __global uint*,
ulong4, ulong4, ulong4);
extern void __amd_copyBuffer(
__global uchar*, __global uchar*,
ulong, ulong, ulong, uint);
extern void __amd_copyBufferAligned(
__global uint*, __global uint*,
ulong, ulong, ulong, uint);
extern void __amd_fillBuffer(
__global uchar*, __global uint*, __constant uchar*,
uint, ulong, ulong);
__kernel void copyBufferRect(
__global uchar* src,
__global uchar* dst,
ulong4 srcRect,
ulong4 dstRect,
ulong4 size)
{
__amd_copyBufferRect(src, dst, srcRect, dstRect, size);
}
__kernel void copyBufferRectAligned(
__global uint* src,
__global uint* dst,
ulong4 srcRect,
ulong4 dstRect,
ulong4 size)
{
__amd_copyBufferRectAligned(src, dst, srcRect, dstRect, size);
}
__kernel void copyBuffer(
__global uchar* srcI,
__global uchar* dstI,
ulong srcOrigin,
ulong dstOrigin,
ulong size,
uint remain)
{
__amd_copyBuffer(srcI, dstI, srcOrigin, dstOrigin, size, remain);
}
__kernel void copyBufferAligned(
__global uint* src,
__global uint* dst,
ulong srcOrigin,
ulong dstOrigin,
ulong size,
uint alignment)
{
__amd_copyBufferAligned(src, dst, srcOrigin, dstOrigin, size, alignment);
}
__kernel void fillBuffer(
__global uchar* bufUChar,
__global uint* bufUInt,
__constant uchar* pattern,
uint patternSize,
ulong offset,
ulong size)
{
__amd_fillBuffer(bufUChar, bufUInt, pattern, patternSize, offset, size);
}
)
#if !defined(WITH_LIGHTNING_COMPILER)
BLIT_KERNELS(
extern void __amd_copyBufferToImage(
__global uint*, __write_only image2d_array_t, ulong4,
int4, int4, uint4, ulong4);
extern void __amd_copyImageToBuffer(
__read_only image2d_array_t, __global uint*, __global ushort*,
__global uchar*, int4, ulong4, int4, uint4, ulong4);
extern void __amd_copyImage(
__read_only image2d_array_t, __write_only image2d_array_t,
int4, int4, int4);
extern void __amd_copyImage1DA(
__read_only image2d_array_t, __write_only image2d_array_t,
int4, int4, int4);
extern void __amd_fillImage(
__write_only image2d_array_t,
float4, int4, uint4, int4, int4, uint);
__kernel void copyBufferToImage(
__global uint* src,
__write_only image2d_array_t dst,
ulong4 srcOrigin,
int4 dstOrigin,
int4 size,
uint4 format,
ulong4 pitch)
{
__amd_copyBufferToImage(src, dst, srcOrigin, dstOrigin, size, format, pitch);
}
__kernel void copyImageToBuffer(
__read_only image2d_array_t src,
__global uint* dstUInt,
__global ushort* dstUShort,
__global uchar* dstUChar,
int4 srcOrigin,
ulong4 dstOrigin,
int4 size,
uint4 format,
ulong4 pitch)
{
__amd_copyImageToBuffer(src, dstUInt, dstUShort, dstUChar,
srcOrigin, dstOrigin, size, format, pitch);
}
__kernel void copyImage(
__read_only image2d_array_t src,
__write_only image2d_array_t dst,
int4 srcOrigin,
int4 dstOrigin,
int4 size)
{
__amd_copyImage(src, dst, srcOrigin, dstOrigin, size);
}
__kernel void copyImage1DA(
__read_only image2d_array_t src,
__write_only image2d_array_t dst,
int4 srcOrigin,
int4 dstOrigin,
int4 size)
{
__amd_copyImage1DA(src, dst, srcOrigin, dstOrigin, size);
}
__kernel void fillImage(
__write_only image2d_array_t image,
float4 patternFLOAT4,
int4 patternINT4,
uint4 patternUINT4,
int4 origin,
int4 size,
uint type)
{
__amd_fillImage(image, patternFLOAT4, patternINT4, patternUINT4,
origin, size, type);
}
)
#endif // !defined(WITH_LIGHTNING_COMPILER)
;
} // namespace device