901e67024a
SWDEV-79445 - OCL generic changes and code clean-up - Update copyright header. No functional changes. Affected files ... ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_agent_amd.h#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_d3d9_amd.hpp#19 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_debugger_amd.h#8 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_lqdflash_amd.h#7 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_p2p_amd.h#2 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_platform_amd.h#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_profile_amd.h#4 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_sdi_amd.cpp#5 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_sdi_amd.h#3 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_semaphore_amd.h#4 edit ... //depot/stg/opencl/drivers/opencl/api/opencl/amdocl/cl_thread_trace_amd.h#5 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d10.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d11.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldeviced3d9.cpp#4 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paldevicegl.cpp#12 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/palmemory.cpp#29 edit ... //depot/stg/opencl/drivers/opencl/runtime/device/pal/paltrap.hpp#3 edit
138 regels
3.8 KiB
C++
138 regels
3.8 KiB
C++
//
|
|
// Copyright (c) 2015 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
|
|
#include "paldevice.hpp"
|
|
|
|
#if defined(ATI_OS_LINUX)
|
|
namespace pal {
|
|
bool Device::associateD3D11Device(void* d3d11Device) { return false; }
|
|
} // namespace pal
|
|
#else // !ATI_OS_LINUX
|
|
|
|
#include <D3D11.h>
|
|
|
|
/**************************************************************************************************************
|
|
* Note: ideally the DXX extension interfaces should be mapped from the DXX perforce branch.
|
|
* This means OCL client spec will need to change to include headers directly from the DXX perforce
|
|
*tree.
|
|
* However, OCL only cares about the DXX OpenCL extension interface class. The spec cannot change
|
|
* without notification. So it is safe to use a local copy of the relevant DXX extension interface
|
|
*classes.
|
|
**************************************************************************************************************/
|
|
#include "DxxOpenCLInteropExt.h"
|
|
|
|
namespace pal {
|
|
|
|
static bool queryD3D11DeviceGPUMask(ID3D11Device* pd3d11Device, UINT* pd3d11DeviceGPUMask) {
|
|
HMODULE hDLL = nullptr;
|
|
IAmdDxExt* pExt = nullptr;
|
|
IAmdDxExtCLInterop* pCLExt = nullptr;
|
|
PFNAmdDxExtCreate11 AmdDxExtCreate11;
|
|
HRESULT hr = S_OK;
|
|
|
|
// Get a handle to the DXX DLL with extension API support
|
|
#if defined _WIN64
|
|
static const CHAR dxxModuleName[13] = "atidxx64.dll";
|
|
#else
|
|
static const CHAR dxxModuleName[13] = "atidxx32.dll";
|
|
#endif
|
|
|
|
hDLL = GetModuleHandle(dxxModuleName);
|
|
|
|
if (hDLL == nullptr) {
|
|
hr = E_FAIL;
|
|
}
|
|
|
|
// Get the exported AmdDxExtCreate() function pointer
|
|
if (SUCCEEDED(hr)) {
|
|
AmdDxExtCreate11 =
|
|
reinterpret_cast<PFNAmdDxExtCreate11>(GetProcAddress(hDLL, "AmdDxExtCreate11"));
|
|
if (AmdDxExtCreate11 == nullptr) {
|
|
hr = E_FAIL;
|
|
}
|
|
}
|
|
|
|
// Create the extension object
|
|
if (SUCCEEDED(hr)) {
|
|
hr = AmdDxExtCreate11(pd3d11Device, &pExt);
|
|
}
|
|
|
|
// Get the extension version information
|
|
if (SUCCEEDED(hr)) {
|
|
AmdDxExtVersion extVersion;
|
|
hr = pExt->GetVersion(&extVersion);
|
|
|
|
if (extVersion.majorVersion == 0) {
|
|
hr = E_FAIL;
|
|
}
|
|
}
|
|
|
|
// Get the OpenCL Interop interface
|
|
if (SUCCEEDED(hr)) {
|
|
pCLExt = static_cast<IAmdDxExtCLInterop*>(pExt->GetExtInterface(AmdDxExtCLInteropID));
|
|
if (pCLExt != nullptr) {
|
|
// Get the GPU mask using the CL Interop extension.
|
|
pCLExt->QueryInteropGpuMask(pd3d11DeviceGPUMask);
|
|
} else {
|
|
hr = E_FAIL;
|
|
}
|
|
}
|
|
|
|
if (pCLExt != nullptr) {
|
|
pCLExt->Release();
|
|
}
|
|
|
|
if (pExt != nullptr) {
|
|
pExt->Release();
|
|
}
|
|
|
|
return (SUCCEEDED(hr));
|
|
}
|
|
|
|
bool Device::associateD3D11Device(void* d3d11Device) {
|
|
ID3D11Device* pd3d11Device = static_cast<ID3D11Device*>(d3d11Device);
|
|
|
|
IDXGIDevice* pDXGIDevice;
|
|
pd3d11Device->QueryInterface(__uuidof(IDXGIDevice), (void**)&pDXGIDevice);
|
|
|
|
IDXGIAdapter* pDXGIAdapter;
|
|
pDXGIDevice->GetAdapter(&pDXGIAdapter);
|
|
|
|
DXGI_ADAPTER_DESC adapterDesc;
|
|
pDXGIAdapter->GetDesc(&adapterDesc);
|
|
|
|
// match the adapter
|
|
bool canInteroperate =
|
|
(properties().osProperties.luidHighPart == adapterDesc.AdapterLuid.HighPart) &&
|
|
(properties().osProperties.luidLowPart == adapterDesc.AdapterLuid.LowPart);
|
|
|
|
UINT chainBitMask = 1 << properties().gpuIndex;
|
|
|
|
// match the chain ID
|
|
if (canInteroperate) {
|
|
UINT d3d11DeviceGPUMask = 0;
|
|
|
|
if (queryD3D11DeviceGPUMask(pd3d11Device, &d3d11DeviceGPUMask)) {
|
|
canInteroperate = (chainBitMask & d3d11DeviceGPUMask) != 0;
|
|
} else {
|
|
// special handling for Intel iGPU + AMD dGPU in LDA mode
|
|
// (only occurs on a PX platform) where
|
|
// the D3D11Device object is created on the Intel iGPU and
|
|
// passed to AMD dGPU (secondary) to interoperate.
|
|
if (chainBitMask > 1) {
|
|
canInteroperate = false;
|
|
}
|
|
}
|
|
}
|
|
|
|
pDXGIDevice->Release();
|
|
pDXGIAdapter->Release();
|
|
|
|
return canInteroperate;
|
|
}
|
|
|
|
} // namespace pal
|
|
|
|
#endif // !ATI_OS_LINUX
|