P4 to Git Change 1234219 by smekhano@stas-rampitec-hsa on 2016/02/03 22:29:28
SWDEV-86849 - HSA HLC: add AssertZExt to get_local_id/get_local_size calls if workgroup size is known to fit i8 or i16 Testing: smoke, precheckin Reviewed by Valery Pykhtin Affected files ... ... //depot/stg/opencl/drivers/opencl/compiler/lib/backends/common/linker.cpp#138 edit ... //depot/stg/opencl/drivers/opencl/compiler/llvm/lib/Target/HSAIL/HSAILISelLowering.cpp#110 edit ... //depot/stg/opencl/drivers/opencl/compiler/llvm/lib/Target/HSAIL/HSAILISelLowering.h#27 edit ... //depot/stg/opencl/drivers/opencl/tests/hsa/src/llc/opt/mul24/local_size.cl#1 add ... //depot/stg/opencl/drivers/opencl/tests/hsa/tlst/llc_opt.tlst#80 edit
This commit is contained in:
@@ -125,6 +125,7 @@
|
||||
#if !defined(LEGACY_COMPLIB)
|
||||
namespace llvm {
|
||||
extern bool HLC_FlushF32Denorms;
|
||||
extern unsigned HLC_Max_WG_Size;
|
||||
}
|
||||
#endif
|
||||
|
||||
@@ -739,6 +740,7 @@ amdcl::OCLLinker::link(llvm::Module* input, std::vector<llvm::Module*> &libs)
|
||||
setDenormsAreZero(Options()->oVariables->DenormsAreZero);
|
||||
#if !defined(LEGACY_COMPLIB)
|
||||
llvm::HLC_FlushF32Denorms = Options()->oVariables->DenormsAreZero;
|
||||
llvm::HLC_Max_WG_Size = 2048; // Maximum HW supported workgroup size
|
||||
#endif
|
||||
setUniformWorkGroupSize(Options()->oVariables->UniformWorkGroupSize);
|
||||
setHaveFastFMA32(chip == "Cypress"
|
||||
|
||||
مرجع در شماره جدید
Block a user