Файли
rocm-systems/projects/rocr-runtime/libhsakmt/tests/kfdtest/src/SDMAPacket.cpp
T

269 рядки
9.7 KiB
C++
Неформатований Звичайний вигляд Історія

2018-07-23 14:45:44 -04:00
/*
* Copyright (C) 2014-2018 Advanced Micro Devices, Inc. All Rights Reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
* OTHER DEALINGS IN THE SOFTWARE.
*
*/
#include <stdint.h>
#include <stddef.h>
#include <string.h>
#include "SDMAPacket.hpp"
#include "KFDTestUtil.hpp"
2018-08-14 09:52:31 -04:00
/* Byte/dword count in many SDMA packets is 1-based in AI, meaning a
* count of 1 is encoded as 0.
*/
#define SDMA_COUNT(c) (m_FamilyId < FAMILY_AI ? (c) : (c)-1)
2018-07-23 14:45:44 -04:00
SDMAWriteDataPacket::SDMAWriteDataPacket(unsigned int familyId, void* destAddr, unsigned int data,
unsigned int packetSizeOffset):
2018-07-23 14:45:44 -04:00
packetData(NULL) {
m_FamilyId = familyId;
InitPacket(destAddr, 1, &data, packetSizeOffset);
2018-07-23 14:45:44 -04:00
}
SDMAWriteDataPacket::SDMAWriteDataPacket(unsigned int familyId, void* destAddr, unsigned int ndw,
2018-07-23 14:45:44 -04:00
void *data):
packetData(NULL) {
m_FamilyId = familyId;
2018-07-23 14:45:44 -04:00
InitPacket(destAddr, ndw, data);
}
void SDMAWriteDataPacket::InitPacket(void* destAddr, unsigned int ndw,
void *data, unsigned int packetSizeOffset) {
2018-07-23 14:45:44 -04:00
packetSize = sizeof(SDMA_PKT_WRITE_UNTILED) +
(ndw - 1) * sizeof(unsigned int);
packetSize -= packetSizeOffset;
packetData = reinterpret_cast<SDMA_PKT_WRITE_UNTILED *>(AllocPacket());
2018-07-23 14:45:44 -04:00
packetData->HEADER_UNION.op = SDMA_OP_WRITE;
packetData->HEADER_UNION.sub_op = SDMA_SUBOP_WRITE_LINEAR;
2018-08-13 09:03:31 -04:00
SplitU64(reinterpret_cast<HSAuint64>(destAddr),
2018-07-23 14:45:44 -04:00
packetData->DST_ADDR_LO_UNION.DW_1_DATA, // dst_addr_31_0
packetData->DST_ADDR_HI_UNION.DW_2_DATA); // dst_addr_63_32
packetData->DW_3_UNION.count = SDMA_COUNT(ndw);
memcpy(&packetData->DATA0_UNION.DW_4_DATA, data, ndw*sizeof(unsigned int));
}
2018-08-02 17:13:26 +08:00
#define BITS (21)
#define TWO_MEG (1 << BITS)
SDMACopyDataPacket::SDMACopyDataPacket(unsigned int familyId,
void *const dsts[], void *src, int n, unsigned int surfsize) {
2018-08-02 17:13:26 +08:00
int32_t size = 0, i;
2018-08-13 09:03:31 -04:00
void **dst = reinterpret_cast<void**>(malloc(sizeof(void*) * n));
2018-08-02 17:13:26 +08:00
const int singlePacketSize = sizeof(SDMA_PKT_COPY_LINEAR) +
sizeof(SDMA_PKT_COPY_LINEAR::DST_ADDR[0]) * n;
if (n > 2)
WARN() << "SDMACopyDataPacket does not support more than 2 dst addresses!" << std::endl;
m_FamilyId = familyId;
2018-08-02 17:13:26 +08:00
memcpy(dst, dsts, sizeof(void*) * n);
packetSize = ((surfsize + TWO_MEG - 1) >> BITS) * singlePacketSize;
2018-07-23 14:45:44 -04:00
SDMA_PKT_COPY_LINEAR *pSDMA = reinterpret_cast<SDMA_PKT_COPY_LINEAR *>(AllocPacket());
2018-07-23 14:45:44 -04:00
packetData = pSDMA;
while (surfsize > 0) {
2018-08-14 09:52:31 -04:00
/* SDMA support maximum 0x3fffe0 byte in one copy, take 2M here */
2018-07-23 14:45:44 -04:00
if (surfsize > TWO_MEG)
size = TWO_MEG;
else
size = surfsize;
2018-08-02 17:13:26 +08:00
memset(pSDMA, 0, singlePacketSize);
2018-07-23 14:45:44 -04:00
pSDMA->HEADER_UNION.op = SDMA_OP_COPY;
pSDMA->HEADER_UNION.sub_op = SDMA_SUBOP_COPY_LINEAR;
2018-08-02 17:13:26 +08:00
pSDMA->HEADER_UNION.broadcast = n > 1 ? 1 : 0;
2018-07-23 14:45:44 -04:00
pSDMA->COUNT_UNION.count = SDMA_COUNT(size);
2018-08-13 09:03:31 -04:00
SplitU64(reinterpret_cast<HSAuint64>(src),
2018-07-23 14:45:44 -04:00
pSDMA->SRC_ADDR_LO_UNION.DW_3_DATA, // src_addr_31_0
pSDMA->SRC_ADDR_HI_UNION.DW_4_DATA); // src_addr_63_32
2018-08-02 17:13:26 +08:00
for (i = 0; i < n; i++)
2018-08-13 09:03:31 -04:00
SplitU64(reinterpret_cast<HSAuint64>(dst[i]),
2018-08-02 17:13:26 +08:00
pSDMA->DST_ADDR[i].DST_ADDR_LO_UNION.DW_5_DATA, // dst_addr_31_0
pSDMA->DST_ADDR[i].DST_ADDR_HI_UNION.DW_6_DATA); // dst_addr_63_32
2018-08-13 09:03:31 -04:00
pSDMA = reinterpret_cast<SDMA_PKT_COPY_LINEAR *>(reinterpret_cast<char *>(pSDMA) + singlePacketSize);
2018-08-02 17:13:26 +08:00
for (i = 0; i < n; i++)
2018-08-13 09:03:31 -04:00
dst[i] = reinterpret_cast<char *>(dst[i]) + size;
src = reinterpret_cast<char *>(src) + size;
2018-07-23 14:45:44 -04:00
surfsize -= size;
}
2018-08-02 17:13:26 +08:00
free(dst);
}
SDMACopyDataPacket::SDMACopyDataPacket(unsigned int familyId, void* dst, void *src, unsigned int surfsize) {
new (this)SDMACopyDataPacket(familyId, &dst, src, 1, surfsize);
2018-07-23 14:45:44 -04:00
}
SDMAFillDataPacket::SDMAFillDataPacket(unsigned int familyId, void *dst, unsigned int data, unsigned int size) {
2018-07-23 14:45:44 -04:00
unsigned int copy_size;
SDMA_PKT_CONSTANT_FILL *pSDMA;
m_FamilyId = familyId;
2018-07-23 14:45:44 -04:00
/* SDMA support maximum 0x3fffe0 byte in one copy. Use 2M copy_size */
2018-08-02 17:13:26 +08:00
m_PacketSize = ((size + TWO_MEG - 1) >> BITS) * sizeof(SDMA_PKT_CONSTANT_FILL);
pSDMA = reinterpret_cast<SDMA_PKT_CONSTANT_FILL *>(AllocPacket());
2018-07-23 14:45:44 -04:00
m_PacketData = pSDMA;
while (size > 0) {
if (size > TWO_MEG)
copy_size = TWO_MEG;
else
copy_size = size;
pSDMA->HEADER_UNION.op = SDMA_OP_CONST_FILL;
pSDMA->HEADER_UNION.sub_op = 0;
2018-08-14 09:52:31 -04:00
/* If both size and address are DW aligned, then use DW fill */
2018-07-23 14:45:44 -04:00
if (!(copy_size & 0x3) && !((HSAuint64)dst & 0x3))
pSDMA->HEADER_UNION.fillsize = 2; /* DW Fill */
else
pSDMA->HEADER_UNION.fillsize = 0; /* Byte Fill */
pSDMA->COUNT_UNION.count = SDMA_COUNT(copy_size);
2018-08-13 09:03:31 -04:00
SplitU64(reinterpret_cast<HSAuint64>(dst),
2018-07-23 14:45:44 -04:00
pSDMA->DST_ADDR_LO_UNION.DW_1_DATA, /*dst_addr_31_0*/
pSDMA->DST_ADDR_HI_UNION.DW_2_DATA); /*dst_addr_63_32*/
pSDMA->DATA_UNION.DW_3_DATA = data;
pSDMA++;
2018-08-13 09:03:31 -04:00
dst = reinterpret_cast<char *>(dst) + copy_size;
2018-07-23 14:45:44 -04:00
size -= copy_size;
}
}
SDMAFencePacket::SDMAFencePacket(void) {
}
SDMAFencePacket::SDMAFencePacket(unsigned int familyId, void* destAddr, unsigned int data) {
m_FamilyId = familyId;
if (m_FamilyId < FAMILY_NV)
InitPacketCI(destAddr, data);
else
InitPacketNV(destAddr, data);
2018-07-23 14:45:44 -04:00
}
SDMAFencePacket::~SDMAFencePacket(void) {
}
void SDMAFencePacket::InitPacketCI(void* destAddr, unsigned int data) {
2018-07-23 14:45:44 -04:00
memset(&packetData, 0, SizeInBytes());
packetData.HEADER_UNION.op = SDMA_OP_FENCE;
2018-08-13 09:03:31 -04:00
SplitU64(reinterpret_cast<HSAuint64>(destAddr),
2018-07-23 14:45:44 -04:00
packetData.ADDR_LO_UNION.DW_1_DATA, /*dst_addr_31_0*/
packetData.ADDR_HI_UNION.DW_2_DATA); /*dst_addr_63_32*/
packetData.DATA_UNION.data = data;
}
void SDMAFencePacket::InitPacketNV(void * destAddr,unsigned int data) {
memset(&packetData, 0, SizeInBytes());
/* GPA=0 becaue we use virtual address
* Snoop = 1 because we want the write be CPU coherent
* System = 1 because the memory is system memory
* mtype = uncached, for the purpose of CPU coherent, L2 policy doesn't matter in this case
*/
packetData.HEADER_UNION.DW_0_DATA = (0 << 23) | (1 << 22) | (1 << 20) | (3 << 16) | SDMA_OP_FENCE;
SplitU64(reinterpret_cast<unsigned long long>(destAddr),
packetData.ADDR_LO_UNION.DW_1_DATA, /*dst_addr_31_0*/
packetData.ADDR_HI_UNION.DW_2_DATA); /*dst_addr_63_32*/
packetData.DATA_UNION.data = data;
}
2018-07-23 14:45:44 -04:00
SDMATrapPacket::SDMATrapPacket(unsigned int eventID) {
InitPacket(eventID);
}
SDMATrapPacket::~SDMATrapPacket(void) {
}
void SDMATrapPacket::InitPacket(unsigned int eventID) {
memset(&packetData, 0, SizeInBytes());
packetData.HEADER_UNION.op = SDMA_OP_TRAP;
packetData.INT_CONTEXT_UNION.int_context = eventID;
}
2018-08-27 15:01:21 +08:00
SDMAPollRegMemPacket::SDMAPollRegMemPacket(void *addr, int value) {
InitPacket(addr, value);
}
SDMAPollRegMemPacket::~SDMAPollRegMemPacket(void) {
}
void SDMAPollRegMemPacket::InitPacket(void *addr, int value) {
memset(&packetData, 0, SizeInBytes());
packetData.HEADER_UNION.op = SDMA_OP_POLL_REGMEM;
packetData.HEADER_UNION.mem_poll = 1;
packetData.HEADER_UNION.func = 0x3; // IsEqual.
SplitU64(reinterpret_cast<unsigned long long>(addr),
packetData.ADDR_LO_UNION.DW_1_DATA,
packetData.ADDR_HI_UNION.DW_2_DATA);
packetData.VALUE_UNION.value = value;
packetData.MASK_UNION.mask = 0xffffffff; // Compare the whole content.
packetData.DW5_UNION.interval = 0x04;
packetData.DW5_UNION.retry_count = 0xfff;
}
2018-08-27 15:01:21 +08:00
SDMATimePacket::SDMATimePacket(void *destaddr) {
InitPacket(destaddr);
}
SDMATimePacket::~SDMATimePacket(void) {
}
void SDMATimePacket::InitPacket(void *destaddr) {
memset(&packetData, 0, SizeInBytes());
packetData.HEADER_UNION.op = SDMA_OP_TIMESTAMP;
packetData.HEADER_UNION.sub_op = 1 << 1; /* Get Global GPU Timestamp*/
if (reinterpret_cast<unsigned long long>(destaddr) & 0x1f)
WARN() << "SDMATimePacket dst address must aligned to 32bytes boundary" << std::endl;
SplitU64(reinterpret_cast<unsigned long long>(destaddr),
packetData.ADDR_LO_UNION.DW_1_DATA, /*dst_addr_31_0*/
packetData.ADDR_HI_UNION.DW_2_DATA); /*dst_addr_63_32*/
}
2019-09-22 17:13:17 -04:00
SDMANopPacket::SDMANopPacket(unsigned int count) {
2019-10-30 22:11:22 -04:00
packetSize = count * sizeof(unsigned int);
packetData = reinterpret_cast<SDMA_PKT_NOP *>(AllocPacket());
2019-09-22 17:13:17 -04:00
packetData->HEADER_UNION.op = SDMA_OP_NOP;
packetData->HEADER_UNION.sub_op = 0;
packetData->HEADER_UNION.count = count - 1;
}