From c4462940dbc5b1a82dcdd45aeebef96a71d62cea Mon Sep 17 00:00:00 2001
From: foreman
Date: Fri, 23 Feb 2018 19:23:42 -0500
Subject: [PATCH] P4 to Git Change 1519084 by gandryey@gera-w8 on 2018/02/23
19:15:27
SWDEV-79445 - OCL generic changes and code clean-up
- Remove debugger checks from the dispatch path. There are no plans to enable debugger in the near future.
Affected files ...
... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palvirtual.cpp#74 edit
[ROCm/clr commit: b561617774cd924a6a7f6339646af15c68ce1432]
---
.../rocclr/runtime/device/pal/palvirtual.cpp | 34 +++----------------
1 file changed, 5 insertions(+), 29 deletions(-)
diff --git a/projects/clr/rocclr/runtime/device/pal/palvirtual.cpp b/projects/clr/rocclr/runtime/device/pal/palvirtual.cpp
index 479f64096e..f053f0f1e2 100644
--- a/projects/clr/rocclr/runtime/device/pal/palvirtual.cpp
+++ b/projects/clr/rocclr/runtime/device/pal/palvirtual.cpp
@@ -2085,11 +2085,6 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const
const_address parameters, bool nativeMem,
amd::Event* enqueueEvent)
{
- uint64_t vmParentWrap = 0;
- uint64_t vmDefQueue = 0;
- VirtualGPU* gpuDefQueue = nullptr;
- amd::HwDebugManager* dbgManager = dev().hwDebugMgr();
-
// If RGP capturing is enabled, then start SQTT trace
if (rgpCaptureEna()) {
dev().rgpCaptureMgr()->PreDispatch(this);
@@ -2110,8 +2105,11 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const
return false;
}
+ // Add ISA memory object to the resource tracking list
AddKernel(kernel);
+ uint64_t vmDefQueue = 0;
+ VirtualGPU* gpuDefQueue = nullptr;
if (hsaKernel.dynamicParallelism()) {
// Initialize GPU device queue for execution (gpuDefQueue)
if (!PreDeviceEnqueue(kernel, hsaKernel, &gpuDefQueue, &vmDefQueue)) {
@@ -2119,14 +2117,7 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const
}
}
- // setup the storage for the memory pointers of the kernel parameters
- uint numParams = kernel.signature().numParameters();
- if (dbgManager) {
- dbgManager->allocParamMemList(numParams);
- }
-
bool needFlush = false;
-
// Avoid flushing when PerfCounter is enabled, to make sure PerfStart/dispatch/PerfEnd
// are in the same cmdBuffer
if (!state_.perfCounterEnabled_) {
@@ -2175,6 +2166,7 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const
amd::NDRangeContainer tmpSizes(sizes.dimensions(), &newOffset[0], &newGlobalSize[0],
&(const_cast(sizes).local()[0]));
+ uint64_t vmParentWrap = 0;
// Program the kernel arguments for the GPU execution
hsa_kernel_dispatch_packet_t* aqlPkt = hsaKernel.loadArguments(
*this, kernel, tmpSizes, parameters, nativeMem, vmDefQueue, &vmParentWrap);
@@ -2190,15 +2182,6 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const
addVmMemory(scratch->memObj_);
}
- // HW Debug for the kernel?
- HwDbgKernelInfo kernelInfo;
- HwDbgKernelInfo* pKernelInfo = nullptr;
-
- if (dbgManager) {
- buildKernelInfo(hsaKernel, aqlPkt, kernelInfo, enqueueEvent);
- pKernelInfo = &kernelInfo;
- }
-
// Set up the dispatch information
Pal::DispatchAqlParams dispatchParam = {};
dispatchParam.pAqlPacket = aqlPkt;
@@ -2222,13 +2205,6 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const
}
eventEnd(MainEngine, gpuEvent);
- if (id != gpuEvent.id) {
- LogError("something is wrong. ID mismatch!\n");
- }
- if (dbgManager && (nullptr != dbgManager->postDispatchCallBackFunc())) {
- dbgManager->executePostDispatchCallBack();
- }
-
// Execute scheduler for device enqueue
if (hsaKernel.dynamicParallelism()) {
PostDeviceEnqueue(kernel, hsaKernel, gpuDefQueue, vmDefQueue, vmParentWrap, &gpuEvent);
@@ -2245,7 +2221,7 @@ bool VirtualGPU::submitKernelInternal(const amd::NDRangeContainer& sizes, const
return false;
}
}
-
+ // Perform post dispatch logic for RGP traces
if (rgpCaptureEna()) {
dev().rgpCaptureMgr()->PostDispatch(this);
}