P4 to Git Change 1234219 by smekhano@stas-rampitec-hsa on 2016/02/03 22:29:28

SWDEV-86849 - HSA HLC: add AssertZExt to get_local_id/get_local_size calls if workgroup size is known to fit in i8 or i16
	Testing: smoke, precheckin
	Reviewed by Valery Pykhtin

Affected files ...

... //depot/stg/opencl/drivers/opencl/compiler/lib/backends/common/linker.cpp#138 edit
... //depot/stg/opencl/drivers/opencl/compiler/llvm/lib/Target/HSAIL/HSAILISelLowering.cpp#110 edit
... //depot/stg/opencl/drivers/opencl/compiler/llvm/lib/Target/HSAIL/HSAILISelLowering.h#27 edit
... //depot/stg/opencl/drivers/opencl/tests/hsa/src/llc/opt/mul24/local_size.cl#1 add
... //depot/stg/opencl/drivers/opencl/tests/hsa/tlst/llc_opt.tlst#80 edit
This commit is contained in:
foreman
2016-02-03 22:33:51 -05:00
والد bb433385db
کامیت bf45e6549f
@@ -125,6 +125,7 @@
#if !defined(LEGACY_COMPLIB)
namespace llvm {
extern bool HLC_FlushF32Denorms;
extern unsigned HLC_Max_WG_Size;
}
#endif
@@ -739,6 +740,7 @@ amdcl::OCLLinker::link(llvm::Module* input, std::vector<llvm::Module*> &libs)
setDenormsAreZero(Options()->oVariables->DenormsAreZero);
#if !defined(LEGACY_COMPLIB)
llvm::HLC_FlushF32Denorms = Options()->oVariables->DenormsAreZero;
llvm::HLC_Max_WG_Size = 2048; // Maximum HW supported workgroup size
#endif
setUniformWorkGroupSize(Options()->oVariables->UniformWorkGroupSize);
setHaveFastFMA32(chip == "Cypress"