2024-04-30 09:01:09 -05:00
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
|
//
|
|
|
|
|
// The University of Illinois/NCSA
|
|
|
|
|
// Open Source License (NCSA)
|
|
|
|
|
//
|
|
|
|
|
// Copyright (c) 2020, Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
|
//
|
|
|
|
|
// Developed by:
|
|
|
|
|
//
|
|
|
|
|
// AMD Research and AMD HSA Software Development
|
|
|
|
|
//
|
|
|
|
|
// Advanced Micro Devices, Inc.
|
|
|
|
|
//
|
|
|
|
|
// www.amd.com
|
|
|
|
|
//
|
|
|
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
|
// of this software and associated documentation files (the "Software"), to
|
|
|
|
|
// deal with the Software without restriction, including without limitation
|
|
|
|
|
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
|
|
|
// and/or sell copies of the Software, and to permit persons to whom the
|
|
|
|
|
// Software is furnished to do so, subject to the following conditions:
|
|
|
|
|
//
|
|
|
|
|
// - Redistributions of source code must retain the above copyright notice,
|
|
|
|
|
// this list of conditions and the following disclaimers.
|
|
|
|
|
// - Redistributions in binary form must reproduce the above copyright
|
|
|
|
|
// notice, this list of conditions and the following disclaimers in
|
|
|
|
|
// the documentation and/or other materials provided with the distribution.
|
|
|
|
|
// - Neither the names of Advanced Micro Devices, Inc,
|
|
|
|
|
// nor the names of its contributors may be used to endorse or promote
|
|
|
|
|
// products derived from this Software without specific prior written
|
|
|
|
|
// permission.
|
|
|
|
|
//
|
|
|
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
|
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
|
|
|
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
|
|
|
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
|
|
|
// DEALINGS WITH THE SOFTWARE.
|
|
|
|
|
//
|
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
|
|
|
|
|
|
#include <cinttypes>
|
|
|
|
|
#include <bitset>
|
|
|
|
|
|
|
|
|
|
#include <sys/mman.h>
|
|
|
|
|
#include <sys/sysinfo.h>
|
2025-02-24 16:17:58 +08:00
|
|
|
#include <sys/stat.h>
|
2024-04-30 09:01:09 -05:00
|
|
|
#include <linux/mman.h>
|
|
|
|
|
#include <fcntl.h>
|
|
|
|
|
#include <unistd.h>
|
2024-12-05 18:02:00 +08:00
|
|
|
#include "impl/wddm/status.h"
|
|
|
|
|
#include "impl/wddm/types.h"
|
|
|
|
|
#include "impl/wddm/device.h"
|
|
|
|
|
#include "impl/wddm/queue.h"
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2024-09-10 08:16:11 -07:00
|
|
|
namespace wsl {
|
|
|
|
|
namespace thunk {
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
const uint32_t WDDMDevice::cmdbuf_aql_frame_num_ = 0x1000;
|
|
|
|
|
|
2025-06-25 12:08:35 +08:00
|
|
|
WDDMDevice::WDDMDevice(D3DKMT_HANDLE adapter, LUID adapter_luid, uint32_t node_id)
|
|
|
|
|
: adapter_(adapter), adapter_luid_(adapter_luid), node_id_(node_id) {
|
2024-04-30 09:01:09 -05:00
|
|
|
memset(&device_info_, 0, sizeof(device_info_));
|
|
|
|
|
|
|
|
|
|
ParseDeviceInfo();
|
|
|
|
|
CreateDevice();
|
|
|
|
|
SetPowerOptimization(false);
|
|
|
|
|
CreatePagingQueue();
|
|
|
|
|
InitCmdbufInfo();
|
2025-11-06 17:31:47 +08:00
|
|
|
QuerySegmentInfo();
|
2024-04-30 09:01:09 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
WDDMDevice::~WDDMDevice() {
|
|
|
|
|
DestroyPagingQueue();
|
|
|
|
|
SetPowerOptimization(true);
|
|
|
|
|
DestroyDevice();
|
|
|
|
|
|
|
|
|
|
DestroyDeviceInfo();
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static NTSTATUS WDDMQueryAdapter(D3DKMT_HANDLE adapter, KMTQUERYADAPTERINFOTYPE type,
|
|
|
|
|
void *data, int size)
|
|
|
|
|
{
|
|
|
|
|
D3DKMT_QUERYADAPTERINFO args = {0};
|
|
|
|
|
|
|
|
|
|
args.hAdapter = adapter;
|
|
|
|
|
args.Type = type;
|
|
|
|
|
args.pPrivateDriverData = data;
|
|
|
|
|
args.PrivateDriverDataSize = size;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
return DXCORE_CALL(D3DKMTQueryAdapterInfo(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
}
|
|
|
|
|
|
2025-11-06 17:31:47 +08:00
|
|
|
bool WDDMDevice::QuerySegmentInfo()
|
|
|
|
|
{
|
|
|
|
|
uint32_t segmentCount = 0;
|
|
|
|
|
segment_infos_.clear();
|
|
|
|
|
|
|
|
|
|
// Get the number of segments
|
|
|
|
|
D3DKMT_QUERYSTATISTICS adapterQuery = {};
|
|
|
|
|
adapterQuery.Type = D3DKMT_QUERYSTATISTICS_ADAPTER;
|
|
|
|
|
adapterQuery.AdapterLuid = adapter_luid_;
|
|
|
|
|
|
|
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTQueryStatistics(&adapterQuery));
|
|
|
|
|
if (ret == STATUS_SUCCESS) {
|
|
|
|
|
segmentCount = adapterQuery.QueryResult.AdapterInformation.NbSegments;
|
|
|
|
|
pr_debug("Total Segments: %u\n", segmentCount);
|
|
|
|
|
} else {
|
|
|
|
|
pr_err("Failed to query adapter info\n");
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for (uint32_t i = 0; i < segmentCount; i++) {
|
|
|
|
|
|
|
|
|
|
D3DKMT_QUERYSTATISTICS segQuery = {};
|
|
|
|
|
segQuery.Type = D3DKMT_QUERYSTATISTICS_SEGMENT;
|
|
|
|
|
segQuery.AdapterLuid = adapter_luid_;
|
|
|
|
|
segQuery.QuerySegment.SegmentId = i;
|
|
|
|
|
|
|
|
|
|
ret = DXCORE_CALL(D3DKMTQueryStatistics(&segQuery));
|
|
|
|
|
if (ret != STATUS_SUCCESS) {
|
|
|
|
|
pr_err("Failed to query segment %u info\n", i);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
auto& seg = segQuery.QueryResult.SegmentInformation;
|
|
|
|
|
|
|
|
|
|
SegmentInfo info;
|
|
|
|
|
info.segment_id = i;
|
|
|
|
|
info.segment_type = seg.SegmentProperties.SegmentType;
|
|
|
|
|
info.system_memory = seg.SegmentProperties.SystemMemory;
|
|
|
|
|
info.aperture = seg.Aperture;
|
|
|
|
|
info.commit_limit = seg.CommitLimit;
|
|
|
|
|
|
|
|
|
|
segment_infos_.push_back(info);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::GetSegmentId(D3DKMT_QUERYSTATISTICS_SEGMENT_TYPE segment_type,
|
|
|
|
|
uint32_t &segment_id)
|
|
|
|
|
{
|
|
|
|
|
for (const auto& seg_info : segment_infos_) {
|
|
|
|
|
if (seg_info.segment_type == segment_type) {
|
|
|
|
|
segment_id = seg_info.segment_id;
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
pr_err("Failed to get segment id for type %u\n", segment_type);
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
2025-10-27 11:20:26 +08:00
|
|
|
/*Local heap(dedicated GPU memory) includes visiable heap and invisiable heap.
|
|
|
|
|
*Non local heap refers to shared GPU memory and it is sytem memory.
|
|
|
|
|
*/
|
2024-04-30 09:01:09 -05:00
|
|
|
uint64_t WDDMDevice::VramAvail(void) {
|
|
|
|
|
D3DKMT_QUERYSTATISTICS stats;
|
|
|
|
|
NTSTATUS ret;
|
|
|
|
|
uint64_t usedVis = 0;
|
|
|
|
|
uint64_t usedInv = 0;
|
2025-10-27 11:20:26 +08:00
|
|
|
uint64_t usedNonLocal = 0;
|
|
|
|
|
uint32_t segmentId = 0;
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
// wait fence complete
|
|
|
|
|
uint64_t value = page_fence_value_.load();
|
|
|
|
|
if(!CpuWait(&page_syncobj_, &value, 1, false))
|
|
|
|
|
return HSA_STATUS_ERROR;
|
|
|
|
|
|
2025-10-27 11:20:26 +08:00
|
|
|
if (IsDgpu()) {
|
|
|
|
|
// local cpu-visible memory
|
|
|
|
|
if(!GetSegmentId(D3DKMT_QUERYSTATISTICS_SEGMENT_TYPE_MEMORY, segmentId))
|
|
|
|
|
return HSA_STATUS_ERROR;
|
|
|
|
|
|
|
|
|
|
memset(&stats, 0, sizeof(D3DKMT_QUERYSTATISTICS));
|
|
|
|
|
stats.Type = D3DKMT_QUERYSTATISTICS_SEGMENT;
|
|
|
|
|
stats.AdapterLuid = adapter_luid_;
|
|
|
|
|
stats.QuerySegment.SegmentId = segmentId;
|
|
|
|
|
ret = DXCORE_CALL(D3DKMTQueryStatistics(&stats));
|
|
|
|
|
if (ret == 0)
|
|
|
|
|
usedVis = stats.QueryResult.SegmentInformation.BytesResident;
|
|
|
|
|
|
|
|
|
|
// local invisible memory
|
|
|
|
|
if (device_info_.local_invisible_heap_size) {
|
|
|
|
|
segmentId++;
|
|
|
|
|
memset(&stats, 0, sizeof(D3DKMT_QUERYSTATISTICS));
|
|
|
|
|
stats.Type = D3DKMT_QUERYSTATISTICS_SEGMENT;
|
|
|
|
|
stats.AdapterLuid = adapter_luid_;
|
|
|
|
|
stats.QuerySegment.SegmentId = 1;
|
|
|
|
|
|
|
|
|
|
ret = DXCORE_CALL(D3DKMTQueryStatistics(&stats));
|
|
|
|
|
if (ret == 0)
|
|
|
|
|
usedInv = stats.QueryResult.SegmentInformation.BytesResident;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return LocalHeapSize() - usedVis - usedInv;
|
|
|
|
|
} else {
|
|
|
|
|
// APU - NonLocal memory
|
|
|
|
|
if(!GetSegmentId(D3DKMT_QUERYSTATISTICS_SEGMENT_TYPE_SYSMEM, segmentId))
|
|
|
|
|
return HSA_STATUS_ERROR;
|
|
|
|
|
|
|
|
|
|
memset(&stats, 0, sizeof(D3DKMT_QUERYSTATISTICS));
|
|
|
|
|
stats.Type = D3DKMT_QUERYSTATISTICS_SEGMENT;
|
|
|
|
|
stats.AdapterLuid = adapter_luid_;
|
|
|
|
|
stats.QuerySegment.SegmentId = segmentId;
|
|
|
|
|
ret = DXCORE_CALL(D3DKMTQueryStatistics(&stats));
|
|
|
|
|
if (ret == 0)
|
|
|
|
|
usedNonLocal = stats.QueryResult.SegmentInformation.BytesResident;
|
|
|
|
|
|
|
|
|
|
return NonLocalHeapSize() - usedNonLocal;
|
|
|
|
|
}
|
2024-04-30 09:01:09 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::CreateDevice(void) {
|
|
|
|
|
D3DKMT_CREATEDEVICE args = {0};
|
|
|
|
|
args.hAdapter = adapter_;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTCreateDevice(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS) {
|
|
|
|
|
device_ = args.hDevice;
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::DestroyDevice(void) {
|
|
|
|
|
D3DKMT_DESTROYDEVICE args = {0};
|
|
|
|
|
args.hDevice = device_;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTDestroyDevice(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS)
|
|
|
|
|
return true;
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::CreatePagingQueue(void) {
|
|
|
|
|
D3DKMT_CREATEPAGINGQUEUE args = {0};
|
|
|
|
|
args.hDevice = device_;
|
|
|
|
|
args.Priority = D3DDDI_PAGINGQUEUE_PRIORITY_NORMAL;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTCreatePagingQueue(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS) {
|
|
|
|
|
page_queue_ = args.hPagingQueue;
|
|
|
|
|
page_syncobj_ = args.hSyncObject;
|
|
|
|
|
page_fence_addr_ = (uint64_t *)args.FenceValueCPUVirtualAddress;
|
|
|
|
|
page_fence_value_ = 0;
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::DestroyPagingQueue(void) {
|
|
|
|
|
D3DDDI_DESTROYPAGINGQUEUE args = {0};
|
|
|
|
|
args.hPagingQueue = page_queue_;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTDestroyPagingQueue(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS)
|
|
|
|
|
return true;
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void WDDMDevice::SetPowerOptimization(bool restore) {
|
|
|
|
|
void *priv_data;
|
|
|
|
|
int priv_size;
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
priv_size = thunk_proxy::GetPowerOptPrivDataSize();
|
|
|
|
|
priv_data = malloc(priv_size);
|
|
|
|
|
assert(priv_data);
|
|
|
|
|
memset(priv_data, 0, priv_size);
|
|
|
|
|
thunk_proxy::FillinPowerOptPrivData(priv_data, restore);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
D3DKMT_ESCAPE d3dkmt_escape;
|
|
|
|
|
memset(&d3dkmt_escape, 0, sizeof(d3dkmt_escape));
|
|
|
|
|
|
|
|
|
|
d3dkmt_escape.hAdapter = adapter_;
|
|
|
|
|
d3dkmt_escape.hDevice = device_;
|
|
|
|
|
d3dkmt_escape.hContext = 0; //KMD only use device to identify the process
|
|
|
|
|
d3dkmt_escape.Type = D3DKMT_ESCAPE_DRIVERPRIVATE;
|
|
|
|
|
d3dkmt_escape.pPrivateDriverData = priv_data;
|
|
|
|
|
d3dkmt_escape.PrivateDriverDataSize = priv_size;
|
|
|
|
|
d3dkmt_escape.Flags.HardwareAccess = true;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS status = DXCORE_CALL(D3DKMTEscape(&d3dkmt_escape));
|
2024-10-09 15:35:44 +08:00
|
|
|
pr_debug("status %d, restore %d\n", status, restore);
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void WDDMDevice::UpdatePageFence(uint64_t fence_value) {
|
|
|
|
|
uint64_t current = page_fence_value_.load();
|
|
|
|
|
|
|
|
|
|
// atomically set fence value when target is bigger than current one
|
|
|
|
|
do {
|
|
|
|
|
if (current >= fence_value)
|
|
|
|
|
break;
|
|
|
|
|
} while (!page_fence_value_.compare_exchange_weak(current, fence_value));
|
|
|
|
|
}
|
|
|
|
|
|
2025-07-05 12:38:07 +08:00
|
|
|
ErrorCode WDDMDevice::CreateGpuMemory(const GpuMemoryCreateInfo &create_info,
|
|
|
|
|
GpuMemory **gpu_mem, gpusize *gpu_va) {
|
2024-04-30 09:01:09 -05:00
|
|
|
ErrorCode ret;
|
|
|
|
|
|
|
|
|
|
*gpu_mem = nullptr;
|
|
|
|
|
auto mem = new GpuMemory(this);
|
|
|
|
|
if (create_info.dmabuf_fd > 0)
|
2025-07-05 12:38:07 +08:00
|
|
|
ret = mem->ImportPhysicalHandle(create_info, gpu_va);
|
2024-04-30 09:01:09 -05:00
|
|
|
else
|
|
|
|
|
ret = mem->Init(create_info);
|
|
|
|
|
if (ret == ErrorCode::Success)
|
|
|
|
|
*gpu_mem = mem;
|
2024-09-10 10:38:30 +08:00
|
|
|
else
|
|
|
|
|
delete mem;
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void *WDDMDevice::Lock(D3DKMT_HANDLE handle) {
|
|
|
|
|
D3DKMT_LOCK2 args = {0};
|
|
|
|
|
args.hDevice = device_;
|
|
|
|
|
args.hAllocation = handle;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTLock2(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS)
|
|
|
|
|
return args.pData;
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::Unlock(D3DKMT_HANDLE handle) {
|
|
|
|
|
D3DKMT_UNLOCK2 args = {0};
|
|
|
|
|
args.hDevice = device_;
|
|
|
|
|
args.hAllocation = handle;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTUnlock2(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS)
|
|
|
|
|
return true;
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::CreateContext(int engine, D3DKMT_HANDLE *handle) {
|
|
|
|
|
void *priv_data;
|
|
|
|
|
int priv_size;
|
|
|
|
|
|
|
|
|
|
int ordinal = EngineOrdinal(engine, &device_info_);
|
|
|
|
|
if (ordinal < 0)
|
|
|
|
|
return false;
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
priv_size = thunk_proxy::GetContextPrivDataSize();
|
|
|
|
|
priv_data = malloc(priv_size);
|
|
|
|
|
assert(priv_data);
|
|
|
|
|
memset(priv_data, 0, priv_size);
|
|
|
|
|
thunk_proxy::FillinContextPrivData(priv_data, SupportStateShadowingByCpFw());
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
D3DKMT_CREATECONTEXTVIRTUAL args = {0};
|
|
|
|
|
args.hDevice = device_;
|
|
|
|
|
args.EngineAffinity = 1 << 0;
|
|
|
|
|
args.NodeOrdinal = ordinal;
|
|
|
|
|
args.pPrivateDriverData = priv_data;
|
|
|
|
|
args.PrivateDriverDataSize = priv_size;
|
|
|
|
|
args.ClientHint = D3DKMT_CLIENTHINT_OPENCL;
|
|
|
|
|
|
|
|
|
|
if (IsHwsEnabled(engine))
|
|
|
|
|
args.Flags.HwQueueSupported = 1;
|
|
|
|
|
else
|
2024-10-14 15:52:52 +08:00
|
|
|
args.Flags.DisableGpuTimeout = thunk_proxy::ShouldDisableGpuTimeout(engine, &device_info_);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTCreateContextVirtual(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS) {
|
|
|
|
|
*handle = args.hContext;
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::DestroyContext(D3DKMT_HANDLE handle) {
|
|
|
|
|
D3DKMT_DESTROYCONTEXT args = {0};
|
|
|
|
|
args.hContext = handle;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTDestroyContext(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS)
|
|
|
|
|
return true;
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::GpuWait(WDDMQueue *queue, const D3DKMT_HANDLE *syncobjs,
|
|
|
|
|
uint64_t *values, int count) {
|
|
|
|
|
|
|
|
|
|
D3DKMT_WAITFORSYNCHRONIZATIONOBJECTFROMGPU args = {0};
|
|
|
|
|
args.hContext = queue->context;
|
|
|
|
|
args.ObjectCount = count;
|
|
|
|
|
args.ObjectHandleArray = syncobjs;
|
|
|
|
|
args.MonitoredFenceValueArray = values;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTWaitForSynchronizationObjectFromGpu(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS)
|
|
|
|
|
return true;
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::GpuSignal(D3DKMT_HANDLE context, const D3DKMT_HANDLE *syncobjs,
|
|
|
|
|
uint64_t *value, int count) {
|
|
|
|
|
D3DKMT_SIGNALSYNCHRONIZATIONOBJECTFROMGPU args = {0};
|
|
|
|
|
args.hContext = context;
|
|
|
|
|
args.ObjectCount = count;
|
|
|
|
|
args.ObjectHandleArray = syncobjs;
|
|
|
|
|
args.MonitoredFenceValueArray = value;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTSignalSynchronizationObjectFromGpu(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS)
|
|
|
|
|
return true;
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::CpuWait(const D3DKMT_HANDLE *syncobjs, uint64_t *value,
|
|
|
|
|
int count, bool wait_any) {
|
|
|
|
|
D3DKMT_WAITFORSYNCHRONIZATIONOBJECTFROMCPU args = {0};
|
|
|
|
|
args.hDevice = device_;
|
|
|
|
|
args.ObjectCount = count;
|
|
|
|
|
args.ObjectHandleArray = syncobjs;
|
|
|
|
|
args.FenceValueArray = value;
|
|
|
|
|
args.Flags.WaitAny = wait_any;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTWaitForSynchronizationObjectFromCpu(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS)
|
|
|
|
|
return true;
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::WaitOnPagingFenceFromCpu() {
|
|
|
|
|
uint64_t page_fence_value = 0;
|
|
|
|
|
|
|
|
|
|
page_fence_value = page_fence_value_.load();
|
|
|
|
|
if (CpuWait(&page_syncobj_, &page_fence_value, 1, false))
|
|
|
|
|
return true;
|
|
|
|
|
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::CreateSyncobj(D3DKMT_HANDLE *handle, uint64_t **addr) {
|
|
|
|
|
D3DKMT_CREATESYNCHRONIZATIONOBJECT2 args = {0};
|
|
|
|
|
args.hDevice = device_;
|
|
|
|
|
args.Info.Type = D3DDDI_MONITORED_FENCE;
|
|
|
|
|
args.Info.MonitoredFence.EngineAffinity = 1 << 0;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTCreateSynchronizationObject2(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret == STATUS_SUCCESS) {
|
|
|
|
|
*handle = args.hSyncObject;
|
|
|
|
|
*addr = (uint64_t *)args.Info.MonitoredFence.FenceValueCPUVirtualAddress;
|
2024-10-09 15:35:44 +08:00
|
|
|
pr_debug("create syncobj cpu addr=%p gpu addr=%" PRIx64 "\n",
|
|
|
|
|
args.Info.MonitoredFence.FenceValueCPUVirtualAddress,
|
|
|
|
|
args.Info.MonitoredFence.FenceValueGPUVirtualAddress);
|
|
|
|
|
|
2024-04-30 09:01:09 -05:00
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void WDDMDevice::DestroySyncobj(D3DKMT_HANDLE handle) {
|
|
|
|
|
D3DKMT_DESTROYSYNCHRONIZATIONOBJECT args = {0};
|
|
|
|
|
args.hSyncObject = handle;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTDestroySynchronizationObject(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret != STATUS_SUCCESS)
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void WDDMDevice::InitCmdbufInfo(void) {
|
|
|
|
|
if (device_info_.major == 9) {
|
|
|
|
|
cmdbuf_aql_frame_size_ = 2 * sizeof(gfx9::AcquireMemTemplate);
|
|
|
|
|
} else if (device_info_.major >= 10) {
|
|
|
|
|
cmdbuf_aql_frame_size_ = 2 * sizeof(gfx10::AcquireMemTemplate);
|
|
|
|
|
}
|
|
|
|
|
|
2025-11-18 17:31:24 +08:00
|
|
|
if (device_info_.major >= 11) {
|
2024-04-30 09:01:09 -05:00
|
|
|
cmdbuf_aql_frame_size_ += sizeof(SetScratchTemplate);
|
2025-11-18 17:31:24 +08:00
|
|
|
cmdbuf_aql_frame_size_ += sizeof(DispatchProgramResourceRegs); // BuildComputeShaderParams
|
|
|
|
|
}
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
cmdbuf_aql_frame_size_ +=
|
|
|
|
|
sizeof(PM4MEC_COPY_DATA) * 2 +
|
|
|
|
|
sizeof(BarrierTemplate) * 2 +
|
|
|
|
|
sizeof(DispatchTemplate) +
|
|
|
|
|
sizeof(AtomicTemplate) * 2;
|
2025-11-18 17:31:24 +08:00
|
|
|
|
|
|
|
|
// Add safety margin to account for alignment and future additions
|
|
|
|
|
cmdbuf_aql_frame_size_ += 128;
|
|
|
|
|
|
2024-04-30 09:01:09 -05:00
|
|
|
cmdbuf_aql_frame_size_ = AlignUp(cmdbuf_aql_frame_size_, 0x10);
|
|
|
|
|
|
|
|
|
|
cmdbuf_size_ = AlignUp(cmdbuf_aql_frame_num_ * cmdbuf_aql_frame_size_, 0x1000);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
uint32_t WDDMDevice::LdsBlocks(const hsa_kernel_dispatch_packet_t *pkt) {
|
|
|
|
|
static const uint32_t blk_sz = 512;
|
|
|
|
|
uint32_t total_sz = pkt->group_segment_size;
|
|
|
|
|
uint32_t blk_num = (total_sz + blk_sz - 1) / blk_sz;
|
|
|
|
|
return blk_num;
|
|
|
|
|
}
|
|
|
|
|
|
2025-07-25 11:42:16 +08:00
|
|
|
NTSTATUS WDDMCreateDevices(std::vector<WDDMDevice *> &devices)
|
2024-04-30 09:01:09 -05:00
|
|
|
{
|
|
|
|
|
bool supported = false;
|
|
|
|
|
D3DKMT_ENUMADAPTERS2 args = {0};
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTEnumAdapters2(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret != STATUS_SUCCESS)
|
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
|
|
if (!args.NumAdapters) {
|
|
|
|
|
return STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
D3DKMT_ADAPTERINFO *info = new D3DKMT_ADAPTERINFO[args.NumAdapters];
|
|
|
|
|
if (!info)
|
|
|
|
|
return STATUS_NO_MEMORY;
|
|
|
|
|
|
|
|
|
|
args.pAdapters = info;
|
2025-09-10 10:58:06 +08:00
|
|
|
ret = DXCORE_CALL(D3DKMTEnumAdapters2(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret != STATUS_SUCCESS)
|
|
|
|
|
goto err_out0;
|
|
|
|
|
|
|
|
|
|
for (int i = 0; i < args.NumAdapters; i++) {
|
2025-07-25 11:23:04 +08:00
|
|
|
D3DKMT_QUERY_DEVICE_IDS query = {0};
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2025-07-25 11:23:04 +08:00
|
|
|
ret = WDDMQueryAdapter(info[i].hAdapter, KMTQAITYPE_PHYSICALADAPTERDEVICEIDS,
|
2024-04-30 09:01:09 -05:00
|
|
|
&query, sizeof(query));
|
|
|
|
|
if (ret != STATUS_SUCCESS)
|
|
|
|
|
goto err_out1;
|
|
|
|
|
|
2025-07-25 11:23:04 +08:00
|
|
|
if (query.DeviceIds.VendorID != 0x1002)
|
2025-03-19 16:56:29 +08:00
|
|
|
continue;
|
|
|
|
|
|
2025-07-25 11:23:04 +08:00
|
|
|
supported = thunk_proxy::QueryAdapterSupported(query.DeviceIds.DeviceID);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2025-03-19 16:56:29 +08:00
|
|
|
if (supported) {
|
2025-07-25 11:42:16 +08:00
|
|
|
auto device = new WDDMDevice(
|
|
|
|
|
info[i].hAdapter, info[i].AdapterLuid, devices.size() + 1);
|
|
|
|
|
if (!device)
|
|
|
|
|
goto err_out1;
|
|
|
|
|
devices.push_back(device);
|
2024-04-30 09:01:09 -05:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2024-11-04 16:44:42 +08:00
|
|
|
delete[] info;
|
2024-04-30 09:01:09 -05:00
|
|
|
return STATUS_SUCCESS;
|
|
|
|
|
|
|
|
|
|
err_out1:
|
2025-07-25 11:42:16 +08:00
|
|
|
for (auto &device : devices)
|
|
|
|
|
delete device;
|
2024-04-30 09:01:09 -05:00
|
|
|
err_out0:
|
2024-11-04 16:44:42 +08:00
|
|
|
delete[] info;
|
2024-04-30 09:01:09 -05:00
|
|
|
return ret;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::ParseDeviceInfo() {
|
|
|
|
|
bool ret;
|
|
|
|
|
|
|
|
|
|
memset(&device_info_, 0, sizeof(device_info_));
|
2024-10-14 15:52:52 +08:00
|
|
|
ret = thunk_proxy::ParseAdapterInfo(adapter_, &device_info_);
|
2024-04-30 09:01:09 -05:00
|
|
|
if (!ret)
|
|
|
|
|
return false;
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void WDDMDevice::DestroyDeviceInfo() {
|
|
|
|
|
free(device_info_.adapter_info);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void WDDMDevice::GetClockCounters(uint64_t *gpu, uint64_t *cpu) {
|
|
|
|
|
|
2025-06-25 17:10:12 +08:00
|
|
|
uint32_t engine = GetComputeEngine();
|
|
|
|
|
int ordinal = EngineOrdinal(engine, &device_info_);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2025-06-25 17:10:12 +08:00
|
|
|
D3DKMT_QUERYCLOCKCALIBRATION args = {0};
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2025-06-25 17:10:12 +08:00
|
|
|
/* LDA(Linked Display Adapter)
|
|
|
|
|
* In the LDA design multiple physical GPUs are linked together to be controlled
|
|
|
|
|
* as a single object from the point of view of power manager, GPU scheduler and
|
|
|
|
|
* GPU memory manager. The physical GPUs are represented by a signal logical adapter
|
|
|
|
|
* object. There is a single DXGADAPTER objects, a single KMD adapter object.
|
|
|
|
|
*
|
|
|
|
|
* Set PhysicalAdapterIndex to 0 by default with None LDA mode.
|
|
|
|
|
*/
|
|
|
|
|
args.hAdapter = adapter_;
|
|
|
|
|
args.NodeOrdinal = ordinal;
|
|
|
|
|
args.PhysicalAdapterIndex = 0;
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS status = DXCORE_CALL(D3DKMTQueryClockCalibration(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (status) {
|
2024-10-09 15:35:44 +08:00
|
|
|
pr_debug("status %d \n", status);
|
2024-04-30 09:01:09 -05:00
|
|
|
} else {
|
2025-06-25 17:10:12 +08:00
|
|
|
if (gpu)
|
|
|
|
|
*gpu = args.ClockData.GpuClockCounter;
|
|
|
|
|
|
|
|
|
|
if (cpu)
|
|
|
|
|
*cpu = args.ClockData.CpuClockCounter;
|
2024-04-30 09:01:09 -05:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::CreateQueue(WDDMQueue *queue) {
|
|
|
|
|
if (!CreateContext(queue->queue_engine, &queue->context))
|
|
|
|
|
return false;
|
|
|
|
|
|
|
|
|
|
GpuMemory *gpu_mem = nullptr;
|
2024-09-11 14:21:54 +08:00
|
|
|
if (queue->cmdbuf_addr == 0) {
|
|
|
|
|
GpuMemoryCreateInfo create_info{};
|
|
|
|
|
create_info.size = queue->cmdbuf_size;
|
|
|
|
|
create_info.domain = thunk_proxy::kSystem;
|
|
|
|
|
|
|
|
|
|
auto code = CreateGpuMemory(create_info, &gpu_mem);
|
|
|
|
|
if (code != ErrorCode::Success)
|
|
|
|
|
goto err_out0;
|
2024-04-30 09:01:09 -05:00
|
|
|
|
2024-09-11 14:21:54 +08:00
|
|
|
queue->cmdbuf = gpu_mem->GetGpuMemoryHandle();
|
|
|
|
|
queue->cmdbuf_addr = gpu_mem->GpuAddress();
|
|
|
|
|
}
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
if (queue->Init())
|
|
|
|
|
goto err_out1;
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
|
|
|
|
|
err_out1:
|
|
|
|
|
delete gpu_mem;
|
|
|
|
|
err_out0:
|
|
|
|
|
DestroyContext(queue->context);
|
|
|
|
|
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void WDDMDevice::DestroyQueue(WDDMQueue *queue) {
|
|
|
|
|
|
|
|
|
|
queue->Fini();
|
|
|
|
|
|
|
|
|
|
auto cmdbuf_mem = GpuMemory::Convert(queue->cmdbuf);
|
|
|
|
|
delete cmdbuf_mem;
|
|
|
|
|
|
|
|
|
|
DestroyContext(queue->context);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::SubmitToSwQueue(WDDMQueue *queue, uint64_t command_addr,
|
|
|
|
|
uint64_t command_size, uint64_t fence_value) {
|
|
|
|
|
void *priv_data;
|
|
|
|
|
int priv_size;
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
priv_size = thunk_proxy::GetSubmitPrivDataSize();
|
|
|
|
|
priv_data = malloc(priv_size);
|
|
|
|
|
assert(priv_data);
|
|
|
|
|
memset(priv_data, 0, priv_size);
|
|
|
|
|
thunk_proxy::FillinSubmitPrivData(priv_data, queue->queue, command_addr, command_size, false);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
D3DKMT_SUBMITCOMMAND args = {0};
|
|
|
|
|
args.Commands = command_addr;
|
|
|
|
|
args.CommandLength = command_size;
|
|
|
|
|
args.BroadcastContextCount = 1;
|
|
|
|
|
args.BroadcastContext[0] = queue->context;
|
|
|
|
|
args.pPrivateDriverData = priv_data;
|
|
|
|
|
args.PrivateDriverDataSize = priv_size;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTSubmitCommand(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret != STATUS_SUCCESS) {
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
if (!GpuSignal(queue->context, &queue->syncobj, &fence_value, 1))
|
|
|
|
|
return false;
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::CreateHwQueue(WDDMQueue *queue) {
|
|
|
|
|
void *priv_data;
|
|
|
|
|
int priv_size;
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
priv_size = thunk_proxy::GetHwQueuePrivDataSize();
|
|
|
|
|
priv_data = malloc(priv_size);
|
|
|
|
|
assert(priv_data);
|
|
|
|
|
memset(priv_data, 0, priv_size);
|
2024-04-30 09:01:09 -05:00
|
|
|
bool FwManagedGfxState = SupportStateShadowingByCpFw();
|
2025-08-01 15:18:51 +08:00
|
|
|
thunk_proxy::FillinHwQueuePrivData(priv_data, FwManagedGfxState, queue->prio);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
D3DKMT_CREATEHWQUEUE createHwQueue = {0};
|
|
|
|
|
createHwQueue.hHwContext = queue->context;
|
2024-10-14 15:52:52 +08:00
|
|
|
createHwQueue.Flags.DisableGpuTimeout = thunk_proxy::ShouldDisableGpuTimeout(queue->queue_engine, &device_info_);
|
2024-04-30 09:01:09 -05:00
|
|
|
createHwQueue.pPrivateDriverData = priv_data;
|
|
|
|
|
createHwQueue.PrivateDriverDataSize = priv_size;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTCreateHwQueue(&createHwQueue));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret != STATUS_SUCCESS) {
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
queue->queue = createHwQueue.hHwQueue;
|
|
|
|
|
queue->syncobj = createHwQueue.hHwQueueProgressFence;
|
|
|
|
|
queue->sync_addr = (uint64_t *)createHwQueue.HwQueueProgressFenceCPUVirtualAddress;
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::DestroyHwQueue(WDDMQueue *queue) {
|
|
|
|
|
D3DKMT_DESTROYHWQUEUE DestroyHwQueue = {
|
|
|
|
|
.hHwQueue = queue->queue,
|
|
|
|
|
};
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTDestroyHwQueue(&DestroyHwQueue));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret != STATUS_SUCCESS) {
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool WDDMDevice::SubmitToHwQueue(WDDMQueue *queue, uint64_t command_addr,
|
|
|
|
|
uint64_t command_size, uint64_t fence_value) {
|
|
|
|
|
void *priv_data;
|
|
|
|
|
int priv_size;
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
priv_size = thunk_proxy::GetSubmitPrivDataSize();
|
|
|
|
|
priv_data = malloc(priv_size);
|
|
|
|
|
assert(priv_data);
|
|
|
|
|
memset(priv_data, 0, priv_size);
|
|
|
|
|
thunk_proxy::FillinSubmitPrivData(priv_data, queue->queue, command_addr, command_size, true);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
D3DKMT_SUBMITCOMMANDTOHWQUEUE args = {0};
|
|
|
|
|
args.hHwQueue = queue->queue;
|
|
|
|
|
args.HwQueueProgressFenceId = fence_value;
|
|
|
|
|
args.CommandBuffer = command_addr;
|
|
|
|
|
args.CommandLength = command_size;
|
|
|
|
|
args.pPrivateDriverData = priv_data;
|
|
|
|
|
args.PrivateDriverDataSize = priv_size;
|
|
|
|
|
|
2025-09-10 10:58:06 +08:00
|
|
|
NTSTATUS ret = DXCORE_CALL(D3DKMTSubmitCommandToHwQueue(&args));
|
2024-04-30 09:01:09 -05:00
|
|
|
if (ret != STATUS_SUCCESS) {
|
2024-10-14 16:04:16 +08:00
|
|
|
pr_err("fail %x\n", ret);
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
2025-08-01 15:18:51 +08:00
|
|
|
free(priv_data);
|
2024-04-30 09:01:09 -05:00
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
2024-09-10 08:16:11 -07:00
|
|
|
} // namespace thunk
|
|
|
|
|
} // namespace wsl
|