From 19968ab78a26fe9f549985d681cd0b05abcbb5bc Mon Sep 17 00:00:00 2001 From: foreman Date: Wed, 1 Aug 2018 11:53:18 -0400 Subject: [PATCH] P4 to Git Change 1588181 by gandryey@gera-w8 on 2018/08/01 11:39:16 SWDEV-155434 - Add SQTT instrumentation tokens for OpenCL dispatches for RGP support - Report the dispatch size in workgroups (global size divided by local size) in the dispatch info. Affected files ... ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palvirtual.cpp#118 edit --- rocclr/runtime/device/pal/palvirtual.cpp | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/rocclr/runtime/device/pal/palvirtual.cpp b/rocclr/runtime/device/pal/palvirtual.cpp index 0dfd42971e..f89e67a4ad 100644 --- a/rocclr/runtime/device/pal/palvirtual.cpp +++ b/rocclr/runtime/device/pal/palvirtual.cpp @@ -2139,7 +2139,10 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const // If RGP capturing is enabled, then start SQTT trace if (rgpCaptureEna()) { dev().rgpCaptureMgr()->PreDispatch(this, hsaKernel, - newGlobalSize[0], newGlobalSize[1], newGlobalSize[2]); + // Report global size in workgroups, since that's the RGP trace semantics + newGlobalSize[0] / sizes.local[0], + newGlobalSize[1] / sizes.local[1], + newGlobalSize[2] / sizes.local[2]); } bool printfEnabled = (hsaKernel.printfInfo().size() > 0) ? true : false;