From ae61cd52cb231b8a9f697b9d64ffb3d998c23386 Mon Sep 17 00:00:00 2001
From: foreman
Date: Fri, 15 Dec 2017 16:04:24 -0500
Subject: [PATCH] P4 to Git Change 1495220 by gandryey@gera-w8 on 2017/12/15
15:59:55
SWDEV-79445 - OCL generic changes and code clean-up
- Follow-up to CL#1495187: also flush the CU caches after the dispatch when profiling is enabled with the wavelimiter (state_.profileEnabled_), not only when profiling() is true.
Affected files ...
... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palvirtual.cpp#67 edit
[ROCm/clr commit: ea9b94057ae4d729e25b1b2e8e81529c9cab2ead]
---
projects/clr/rocclr/runtime/device/pal/palvirtual.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/projects/clr/rocclr/runtime/device/pal/palvirtual.cpp b/projects/clr/rocclr/runtime/device/pal/palvirtual.cpp
index 5e2301623d..0f2c685c51 100644
--- a/projects/clr/rocclr/runtime/device/pal/palvirtual.cpp
+++ b/projects/clr/rocclr/runtime/device/pal/palvirtual.cpp
@@ -1984,7 +1984,7 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const
iCmd()->CmdDispatchAql(dispatchParam);
// Note: This a workaround for incorrect results reported with release_mem packet,
// when the packet can be processed later after this dispatch and including extra time
- if (profiling()) {
+ if (profiling() || state_.profileEnabled_) {
flushCUCaches();
}
eventEnd(MainEngine, gpuEvent);