2024-03-25 17:05:31 -04:00
|
|
|
/*
|
|
|
|
|
Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
|
|
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
|
|
|
in the Software without restriction, including without limitation the rights
|
|
|
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
|
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
|
|
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
|
|
|
all copies or substantial portions of the Software.
|
|
|
|
|
|
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
|
THE SOFTWARE.
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
#include "rocjpeg_vaapi_decoder.h"
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
2024-07-12 15:20:38 -04:00
|
|
|
* @brief Default constructor for RocJpegVaapiMemoryPool class.
|
2024-05-15 13:44:51 -04:00
|
|
|
*
|
|
|
|
|
* This constructor initializes the memory pool for different surface formats used in RocJpegVappiDecoder.
|
|
|
|
|
* It creates an empty vector for each surface format and stores it in the mem_pool_ map.
|
|
|
|
|
*
|
|
|
|
|
* @param None
|
|
|
|
|
* @return None
|
|
|
|
|
*/
|
2024-07-12 15:20:38 -04:00
|
|
|
RocJpegVaapiMemoryPool::RocJpegVaapiMemoryPool() {
|
2024-07-19 19:04:31 -04:00
|
|
|
std::vector<uint32_t> surface_formats = {VA_FOURCC_RGBA, VA_FOURCC_RGBP, VA_FOURCC_444P, VA_FOURCC_422V, ROCJPEG_FOURCC_YUYV, VA_FOURCC_NV12, VA_FOURCC_Y800};
|
2024-04-22 14:37:45 -04:00
|
|
|
for (auto surface_format : surface_formats) {
|
2024-07-12 15:20:38 -04:00
|
|
|
mem_pool_[surface_format] = std::vector<RocJpegVaapiMemPoolEntry>();
|
2024-04-22 14:37:45 -04:00
|
|
|
}
|
2024-07-19 19:04:31 -04:00
|
|
|
max_pool_size_ = 2;
|
2024-04-22 14:37:45 -04:00
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
2024-07-12 15:20:38 -04:00
|
|
|
* @brief Releases the resources used by the RocJpegVaapiMemoryPool.
|
2024-05-15 13:44:51 -04:00
|
|
|
*
|
|
|
|
|
* This function releases the VA-API contexts, surfaces, HIP device memory, and HIP external memory
|
|
|
|
|
* associated with the memory pool. It iterates over each entry in the memory pool and checks if
|
|
|
|
|
* the VA-API context ID, VA-API surface ID, HIP mapped device memory, or HIP external memory is
|
|
|
|
|
* non-zero. If so, it destroys the corresponding resource using the appropriate API function.
|
|
|
|
|
* Finally, it resets the HIP interop structure for each entry in the memory pool.
|
|
|
|
|
*/
|
2024-07-12 15:20:38 -04:00
|
|
|
void RocJpegVaapiMemoryPool::ReleaseResources() {
|
2024-04-22 14:37:45 -04:00
|
|
|
VAStatus va_status;
|
|
|
|
|
hipError_t hip_status;
|
|
|
|
|
for (auto& pair : mem_pool_) {
|
|
|
|
|
for (auto& entry : pair.second) {
|
2024-07-12 15:20:38 -04:00
|
|
|
if (!entry.va_surface_ids.empty()) {
|
|
|
|
|
va_status = vaDestroySurfaces(va_display_, entry.va_surface_ids.data(), entry.va_surface_ids.size());
|
2024-04-22 14:37:45 -04:00
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaDestroySurfaces failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
2024-07-12 15:20:38 -04:00
|
|
|
if (!entry.hip_interops.empty()) {
|
|
|
|
|
for(auto& hip_interop_entry : entry.hip_interops) {
|
|
|
|
|
if (hip_interop_entry.hip_mapped_device_mem != nullptr) {
|
|
|
|
|
hip_status = hipFree(hip_interop_entry.hip_mapped_device_mem);
|
|
|
|
|
if (hip_status != hipSuccess) {
|
|
|
|
|
ERR("ERROR: hipFree failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (hip_interop_entry.hip_ext_mem != nullptr) {
|
|
|
|
|
hip_status = hipDestroyExternalMemory(hip_interop_entry.hip_ext_mem);
|
|
|
|
|
if (hip_status != hipSuccess) {
|
|
|
|
|
ERR("ERROR: hipDestroyExternalMemory failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
2024-04-22 14:37:45 -04:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2024-07-19 19:04:31 -04:00
|
|
|
void RocJpegVaapiMemoryPool::SetPoolSize(uint32_t max_pool_size) {
|
|
|
|
|
max_pool_size_ = max_pool_size;
|
2024-04-22 14:37:45 -04:00
|
|
|
}
|
|
|
|
|
|
2024-07-12 15:20:38 -04:00
|
|
|
void RocJpegVaapiMemoryPool::SetVaapiDisplay(const VADisplay& va_display) {
|
2024-04-22 14:37:45 -04:00
|
|
|
va_display_ = va_display;
|
|
|
|
|
}
|
|
|
|
|
|
2024-10-01 09:14:15 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Retrieves the total size of the memory pool.
|
|
|
|
|
*
|
|
|
|
|
* This function iterates through the memory pool and sums up the sizes of all entries.
|
|
|
|
|
*
|
|
|
|
|
* @return The total size of the memory pool.
|
|
|
|
|
*/
|
|
|
|
|
size_t RocJpegVaapiMemoryPool::GetTotalMemPoolSize() const {
|
|
|
|
|
size_t total_mem_pool_size = 0;
|
|
|
|
|
for (const auto& pair : mem_pool_) {
|
|
|
|
|
total_mem_pool_size += pair.second.size();
|
|
|
|
|
}
|
|
|
|
|
return total_mem_pool_size;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* @brief Deletes an idle entry from the memory pool.
|
|
|
|
|
*
|
|
|
|
|
* This function iterates through the memory pool and searches for an entry
|
|
|
|
|
* with the status `kIdle`. If such an entry is found, it performs the following
|
|
|
|
|
* cleanup operations:
|
|
|
|
|
* - Destroys the VAAPI context if it exists.
|
|
|
|
|
* - Destroys the VAAPI surfaces if they exist.
|
|
|
|
|
* - Frees HIP mapped device memory and destroys HIP external memory if they exist.
|
|
|
|
|
* - Resets the HIP interop entries.
|
|
|
|
|
*
|
|
|
|
|
* After performing the cleanup, the idle entry is removed from the memory pool.
|
|
|
|
|
*
|
|
|
|
|
* @return true if an idle entry was found and deleted, false otherwise.
|
|
|
|
|
*/
|
|
|
|
|
bool RocJpegVaapiMemoryPool::DeleteIdleEntry() {
|
|
|
|
|
for (auto& pair : mem_pool_) {
|
|
|
|
|
auto it = std::find_if(pair.second.begin(), pair.second.end(), [](const RocJpegVaapiMemPoolEntry& entry) {return entry.entry_status == kIdle;});
|
|
|
|
|
if (it != pair.second.end()) {
|
|
|
|
|
auto index = std::distance(pair.second.begin(), it);
|
|
|
|
|
if (!pair.second[index].va_surface_ids.empty()) {
|
|
|
|
|
CHECK_VAAPI(vaDestroySurfaces(va_display_, pair.second[index].va_surface_ids.data(), pair.second[index].va_surface_ids.size()));
|
|
|
|
|
std::fill(pair.second[index].va_surface_ids.begin(), pair.second[index].va_surface_ids.end(), 0);
|
|
|
|
|
}
|
|
|
|
|
if (!pair.second[index].hip_interops.empty()) {
|
|
|
|
|
for(auto& hip_interop_entry : pair.second[index].hip_interops) {
|
|
|
|
|
if (hip_interop_entry.hip_mapped_device_mem != nullptr)
|
|
|
|
|
CHECK_HIP(hipFree(hip_interop_entry.hip_mapped_device_mem));
|
|
|
|
|
if (hip_interop_entry.hip_ext_mem != nullptr)
|
|
|
|
|
CHECK_HIP(hipDestroyExternalMemory(hip_interop_entry.hip_ext_mem));
|
|
|
|
|
memset((void*)&hip_interop_entry, 0, sizeof(hip_interop_entry));
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
pair.second.erase(it);
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Adds a pool entry to the memory pool for a specific surface format.
|
|
|
|
|
*
|
|
|
|
|
* This function adds a pool entry to the memory pool for a specific surface format.
|
|
|
|
|
* If the memory pool for the given surface format is not full, the new entry is added to the pool.
|
|
|
|
|
* If the memory pool is full, the oldest entry is removed from the pool and replaced with the new entry.
|
|
|
|
|
* If the removed entry has associated resources (VA context, VA surface, HIP memory), they are destroyed and freed.
|
|
|
|
|
*
|
|
|
|
|
* @param surface_format The surface format for which the pool entry is being added.
|
|
|
|
|
* @param pool_entry The pool entry to be added.
|
|
|
|
|
* @return The status of the operation. Returns ROCJPEG_STATUS_SUCCESS if the operation is successful.
|
|
|
|
|
*/
|
2024-07-12 15:20:38 -04:00
|
|
|
RocJpegStatus RocJpegVaapiMemoryPool::AddPoolEntry(uint32_t surface_format, const RocJpegVaapiMemPoolEntry& pool_entry) {
|
2024-10-01 09:14:15 -04:00
|
|
|
size_t total_mem_pool_size = GetTotalMemPoolSize();
|
2024-07-19 19:04:31 -04:00
|
|
|
auto& entries = mem_pool_[surface_format];
|
2024-10-01 09:14:15 -04:00
|
|
|
if (total_mem_pool_size < max_pool_size_) {
|
2024-07-19 19:04:31 -04:00
|
|
|
entries.push_back(pool_entry);
|
2024-04-22 14:37:45 -04:00
|
|
|
} else {
|
2024-10-01 09:14:15 -04:00
|
|
|
if (DeleteIdleEntry()) {
|
2024-08-14 16:45:05 -04:00
|
|
|
entries.push_back(pool_entry);
|
|
|
|
|
} else {
|
|
|
|
|
ERR("cannot find an idle entry in the the memory pool!");
|
|
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
2024-04-22 14:37:45 -04:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
2024-07-12 15:20:38 -04:00
|
|
|
* @brief Retrieves a `RocJpegVaapiMemPoolEntry` from the memory pool based on the specified surface format, image width, and image height.
|
2024-05-15 13:44:51 -04:00
|
|
|
*
|
2024-07-04 15:15:50 -04:00
|
|
|
* @param surface_format The surface pixel format of the entry to retrieve.
|
2024-05-15 13:44:51 -04:00
|
|
|
* @param image_width The width of the image of the entry to retrieve.
|
|
|
|
|
* @param image_height The height of the image of the entry to retrieve.
|
2024-07-12 15:20:38 -04:00
|
|
|
* @param num_surfaces The number of surfaces of the entry to retrieve.
|
|
|
|
|
* @return The matching `RocJpegVaapiMemPoolEntry` if found, or a default-initialized entry if not found.
|
2024-05-15 13:44:51 -04:00
|
|
|
*/
|
2024-07-12 15:20:38 -04:00
|
|
|
RocJpegVaapiMemPoolEntry RocJpegVaapiMemoryPool::GetEntry(uint32_t surface_format, uint32_t image_width, uint32_t image_height, uint32_t num_surfaces) {
|
2024-08-14 16:45:05 -04:00
|
|
|
for (auto& entry : mem_pool_[surface_format]) {
|
|
|
|
|
if (entry.image_width == image_width && entry.image_height == image_height && entry.va_surface_ids.size() == num_surfaces && entry.entry_status == kIdle) {
|
|
|
|
|
entry.entry_status = kBusy;
|
2024-04-22 14:37:45 -04:00
|
|
|
return entry;
|
|
|
|
|
}
|
|
|
|
|
}
|
2024-10-30 11:48:47 -04:00
|
|
|
return {0, 0, kIdle, {}, {}};
|
2024-04-22 14:37:45 -04:00
|
|
|
}
|
|
|
|
|
|
2024-07-12 15:20:38 -04:00
|
|
|
/**
 * @brief Checks whether a VA-API surface id belongs to any entry of the memory pool.
 *
 * @param surface_id The surface id to look for.
 * @return true if some entry lists surface_id among its surfaces, false otherwise.
 */
bool RocJpegVaapiMemoryPool::FindSurfaceId(VASurfaceID surface_id) {
    const auto owns_surface = [surface_id](const RocJpegVaapiMemPoolEntry& entry) {
        return std::find(entry.va_surface_ids.begin(), entry.va_surface_ids.end(), surface_id) != entry.va_surface_ids.end();
    };
    for (auto format_it = mem_pool_.begin(); format_it != mem_pool_.end(); ++format_it) {
        const auto& entries = format_it->second;
        if (std::any_of(entries.begin(), entries.end(), owns_surface)) {
            return true;
        }
    }
    return false;
}
|
|
|
|
|
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Retrieves the HipInteropDeviceMem associated with a given VASurfaceID from the memory pool.
|
|
|
|
|
*
|
|
|
|
|
* This function searches the memory pool for the entry that matches the provided VASurfaceID.
|
|
|
|
|
* If a matching entry is found and the associated HipInteropDeviceMem is not already initialized,
|
|
|
|
|
* it initializes the HipInteropDeviceMem by exporting the VASurfaceID as a DRM prime surface handle,
|
|
|
|
|
* importing it as an external memory object, and getting the mapped buffer for the external memory.
|
|
|
|
|
* The function then updates the HipInteropDeviceMem with the surface format, width, height, offsets,
|
|
|
|
|
* pitches, and number of layers from the exported surface descriptor.
|
|
|
|
|
*
|
|
|
|
|
* @param surface_id The VASurfaceID to retrieve the HipInteropDeviceMem for.
|
|
|
|
|
* @param hip_interop [out] The retrieved HipInteropDeviceMem.
|
|
|
|
|
* @return RocJpegStatus Returns ROCJPEG_STATUS_SUCCESS if the HipInteropDeviceMem is successfully retrieved,
|
|
|
|
|
* ROCJPEG_STATUS_INVALID_PARAMETER if the requested surface_id is not found in the memory pool.
|
|
|
|
|
*/
|
2024-07-12 15:20:38 -04:00
|
|
|
RocJpegStatus RocJpegVaapiMemoryPool::GetHipInteropMem(VASurfaceID surface_id, HipInteropDeviceMem& hip_interop) {
|
2024-04-22 14:37:45 -04:00
|
|
|
for (auto& pair : mem_pool_) {
|
|
|
|
|
auto& entries = pair.second;
|
|
|
|
|
auto it = std::find_if(entries.begin(), entries.end(),
|
2024-07-12 15:20:38 -04:00
|
|
|
[surface_id](const RocJpegVaapiMemPoolEntry& entry){return std::find(entry.va_surface_ids.begin(), entry.va_surface_ids.end(), surface_id) != entry.va_surface_ids.end();});
|
2024-04-22 14:37:45 -04:00
|
|
|
if (it != entries.end()) {
|
2024-07-12 15:20:38 -04:00
|
|
|
auto idx = std::distance(it->va_surface_ids.begin(), std::find(it->va_surface_ids.begin(), it->va_surface_ids.end(), surface_id));
|
|
|
|
|
if (it->hip_interops[idx].hip_mapped_device_mem != nullptr) {
|
|
|
|
|
CHECK_HIP(hipFree(it->hip_interops[idx].hip_mapped_device_mem));
|
|
|
|
|
if (it->hip_interops[idx].hip_ext_mem != nullptr) {
|
|
|
|
|
CHECK_HIP(hipDestroyExternalMemory(it->hip_interops[idx].hip_ext_mem));
|
2024-07-04 13:13:39 -04:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
VADRMPRIMESurfaceDescriptor va_drm_prime_surface_desc = {};
|
|
|
|
|
CHECK_VAAPI(vaExportSurfaceHandle(va_display_, surface_id, VA_SURFACE_ATTRIB_MEM_TYPE_DRM_PRIME_2,
|
|
|
|
|
VA_EXPORT_SURFACE_READ_ONLY | VA_EXPORT_SURFACE_SEPARATE_LAYERS,
|
|
|
|
|
&va_drm_prime_surface_desc));
|
2024-04-22 14:37:45 -04:00
|
|
|
|
2024-07-04 13:13:39 -04:00
|
|
|
hipExternalMemoryHandleDesc external_mem_handle_desc = {};
|
|
|
|
|
hipExternalMemoryBufferDesc external_mem_buffer_desc = {};
|
|
|
|
|
external_mem_handle_desc.type = hipExternalMemoryHandleTypeOpaqueFd;
|
|
|
|
|
external_mem_handle_desc.handle.fd = va_drm_prime_surface_desc.objects[0].fd;
|
|
|
|
|
external_mem_handle_desc.size = va_drm_prime_surface_desc.objects[0].size;
|
2024-04-22 14:37:45 -04:00
|
|
|
|
2024-07-12 15:20:38 -04:00
|
|
|
CHECK_HIP(hipImportExternalMemory(&it->hip_interops[idx].hip_ext_mem, &external_mem_handle_desc));
|
2024-07-04 13:13:39 -04:00
|
|
|
external_mem_buffer_desc.size = va_drm_prime_surface_desc.objects[0].size;
|
2024-07-12 15:20:38 -04:00
|
|
|
CHECK_HIP(hipExternalMemoryGetMappedBuffer((void**)&it->hip_interops[idx].hip_mapped_device_mem, it->hip_interops[idx].hip_ext_mem, &external_mem_buffer_desc));
|
|
|
|
|
|
|
|
|
|
it->hip_interops[idx].surface_format = va_drm_prime_surface_desc.fourcc;
|
|
|
|
|
it->hip_interops[idx].width = va_drm_prime_surface_desc.width;
|
|
|
|
|
it->hip_interops[idx].height = va_drm_prime_surface_desc.height;
|
|
|
|
|
it->hip_interops[idx].size = va_drm_prime_surface_desc.objects[0].size;
|
|
|
|
|
it->hip_interops[idx].offset[0] = va_drm_prime_surface_desc.layers[0].offset[0];
|
|
|
|
|
it->hip_interops[idx].offset[1] = va_drm_prime_surface_desc.layers[1].offset[0];
|
|
|
|
|
it->hip_interops[idx].offset[2] = va_drm_prime_surface_desc.layers[2].offset[0];
|
|
|
|
|
it->hip_interops[idx].pitch[0] = va_drm_prime_surface_desc.layers[0].pitch[0];
|
|
|
|
|
it->hip_interops[idx].pitch[1] = va_drm_prime_surface_desc.layers[1].pitch[0];
|
|
|
|
|
it->hip_interops[idx].pitch[2] = va_drm_prime_surface_desc.layers[2].pitch[0];
|
|
|
|
|
it->hip_interops[idx].num_layers = va_drm_prime_surface_desc.num_layers;
|
2024-04-22 14:37:45 -04:00
|
|
|
|
2024-07-04 13:13:39 -04:00
|
|
|
for (uint32_t i = 0; i < va_drm_prime_surface_desc.num_objects; ++i) {
|
|
|
|
|
close(va_drm_prime_surface_desc.objects[i].fd);
|
2024-04-22 14:37:45 -04:00
|
|
|
}
|
2024-07-12 15:20:38 -04:00
|
|
|
hip_interop = it->hip_interops[idx];
|
2024-04-22 14:37:45 -04:00
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
// it shouldn't reach here unless the requested surface_id is not in the memory pool.
|
|
|
|
|
ERR("the surface_id: " + TOSTR(surface_id) + " was not found in the memory pool!");
|
|
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
|
|
|
|
}
|
2024-08-14 16:45:05 -04:00
|
|
|
|
|
|
|
|
/**
 * @brief Marks the pool entry that owns the given surface as idle.
 *
 * @param surface_id The surface id whose owning entry should be marked kIdle.
 * @return true if an entry containing surface_id was found and marked, false otherwise.
 */
bool RocJpegVaapiMemoryPool::SetSurfaceAsIdle(VASurfaceID surface_id) {
    const auto owns_surface = [surface_id](const RocJpegVaapiMemPoolEntry& entry) {
        return std::find(entry.va_surface_ids.begin(), entry.va_surface_ids.end(), surface_id) != entry.va_surface_ids.end();
    };
    for (auto& pair : mem_pool_) {
        auto& entries = pair.second;
        auto owner = std::find_if(entries.begin(), entries.end(), owns_surface);
        if (owner != entries.end()) {
            owner->entry_status = kIdle;
            return true;
        }
    }
    return false;
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Constructs a RocJpegVappiDecoder object.
|
|
|
|
|
*
|
|
|
|
|
* This constructor initializes a RocJpegVappiDecoder object with the specified device ID and default values for other member variables.
|
|
|
|
|
*
|
|
|
|
|
* @param device_id The ID of the device to be used for decoding.
|
|
|
|
|
*/
|
2024-03-25 17:05:31 -04:00
|
|
|
RocJpegVappiDecoder::RocJpegVappiDecoder(int device_id) : device_id_{device_id}, drm_fd_{-1}, min_picture_width_{64}, min_picture_height_{64},
|
|
|
|
|
max_picture_width_{4096}, max_picture_height_{4096}, va_display_{0}, va_config_attrib_{{}}, va_config_id_{0}, va_profile_{VAProfileJPEGBaseline},
|
2024-07-12 15:20:38 -04:00
|
|
|
vaapi_mem_pool_(std::make_unique<RocJpegVaapiMemoryPool>()), current_vcn_jpeg_spec_{0}, va_picture_parameter_buf_id_{0}, va_quantization_matrix_buf_id_{0}, va_huffmantable_buf_id_{0},
|
2024-04-22 14:37:45 -04:00
|
|
|
va_slice_param_buf_id_{0}, va_slice_data_buf_id_{0} {
|
2024-04-11 13:37:08 -04:00
|
|
|
vcn_jpeg_spec_ = {{"gfx908", {2, false, false}},
|
|
|
|
|
{"gfx90a", {2, false, false}},
|
|
|
|
|
{"gfx940", {24, true, true}},
|
|
|
|
|
{"gfx941", {32, true, true}},
|
2024-07-12 15:20:38 -04:00
|
|
|
{"gfx942_mi300a", {24, true, true}},
|
|
|
|
|
{"gfx942_mi300x", {32, true, true}},
|
2024-07-08 09:32:01 -04:00
|
|
|
{"gfx1030", {1, false, false}},
|
|
|
|
|
{"gfx1031", {1, false, false}},
|
|
|
|
|
{"gfx1032", {1, false, false}},
|
|
|
|
|
{"gfx1100", {1, false, false}},
|
2024-04-11 13:37:08 -04:00
|
|
|
{"gfx1101", {1, false, false}},
|
2024-07-24 12:36:54 -04:00
|
|
|
{"gfx1102", {1, false, false}},
|
|
|
|
|
{"gfx1200", {1, false, false}},
|
|
|
|
|
{"gfx1201", {1, false, false}}};
|
2024-05-15 13:44:51 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* @brief Destructor for the RocJpegVappiDecoder class.
|
|
|
|
|
*
|
|
|
|
|
* This destructor is responsible for cleaning up the resources used by the RocJpegVappiDecoder object.
|
|
|
|
|
* It closes the DRM file descriptor, releases the VAAPI memory pool resources, destroys the VAAPI data buffers,
|
|
|
|
|
* destroys the VAAPI configuration, and terminates the VAAPI display.
|
|
|
|
|
*
|
|
|
|
|
* @note If any of the cleanup operations fail, an error message will be printed.
|
|
|
|
|
*/
|
2024-03-25 17:05:31 -04:00
|
|
|
RocJpegVappiDecoder::~RocJpegVappiDecoder() {
|
|
|
|
|
if (drm_fd_ != -1) {
|
|
|
|
|
close(drm_fd_);
|
|
|
|
|
}
|
|
|
|
|
if (va_display_) {
|
2024-04-22 14:37:45 -04:00
|
|
|
vaapi_mem_pool_->ReleaseResources();
|
2024-03-25 17:05:31 -04:00
|
|
|
RocJpegStatus rocjpeg_status = DestroyDataBuffers();
|
|
|
|
|
if (rocjpeg_status != ROCJPEG_STATUS_SUCCESS) {
|
|
|
|
|
ERR("Error: Failed to destroy VAAPI buffer");
|
|
|
|
|
}
|
|
|
|
|
VAStatus va_status;
|
2024-10-30 11:48:47 -04:00
|
|
|
if (va_surface_id_ != 0) {
|
|
|
|
|
va_status = vaDestroySurfaces(va_display_, &va_surface_id_, 1);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaDestroySurfaces failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (va_context_id_ != 0) {
|
|
|
|
|
va_status = vaDestroyContext(va_display_, va_context_id_);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaDestroyContext failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
2024-03-25 17:05:31 -04:00
|
|
|
if (va_config_id_) {
|
|
|
|
|
va_status = vaDestroyConfig(va_display_, va_config_id_);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaDestroyConfig failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
va_status = vaTerminate(va_display_);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaTerminate failed!");
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Initializes the VAAPI decoder for RocJpeg.
|
|
|
|
|
*
|
|
|
|
|
* This function initializes the VAAPI decoder for RocJpeg by setting the device ID, GCN architecture name,
|
|
|
|
|
* and other necessary parameters. It also sets up the VAAPI display and creates the decoder configuration.
|
|
|
|
|
*
|
|
|
|
|
* @param device_name The name of the device.
|
|
|
|
|
* @param gcn_arch_name The name of the GCN architecture.
|
|
|
|
|
* @param device_id The ID of the device.
|
|
|
|
|
* @return The status of the initialization process.
|
|
|
|
|
*/
|
2024-04-01 18:06:44 -04:00
|
|
|
RocJpegStatus RocJpegVappiDecoder::InitializeDecoder(std::string device_name, std::string gcn_arch_name, int device_id) {
|
|
|
|
|
device_id_ = device_id;
|
2024-03-27 14:14:27 -04:00
|
|
|
std::size_t pos = gcn_arch_name.find_first_of(":");
|
|
|
|
|
std::string gcn_arch_name_base = (pos != std::string::npos) ? gcn_arch_name.substr(0, pos) : gcn_arch_name;
|
|
|
|
|
|
2024-07-12 15:20:38 -04:00
|
|
|
std::string gcn_arch_name_base_temp = gcn_arch_name_base;
|
|
|
|
|
// Check if the device name contains "MI300A" to identify if it is MI300A or MI300X ASIC
|
|
|
|
|
// as both have the same gfx942 architecture name.
|
|
|
|
|
bool is_gfx942_detected = (gcn_arch_name_base.compare("gfx942") == 0);
|
|
|
|
|
if (is_gfx942_detected) {
|
|
|
|
|
std::string mi300a = "MI300A";
|
|
|
|
|
size_t found_mi300a = device_name.find(mi300a);
|
2024-07-19 19:04:31 -04:00
|
|
|
gcn_arch_name_base_temp = (found_mi300a != std::string::npos) ? gcn_arch_name_base_temp + "_mi300a"
|
|
|
|
|
: gcn_arch_name_base_temp + "_mi300x";
|
2024-07-12 15:20:38 -04:00
|
|
|
}
|
|
|
|
|
|
2024-03-27 14:14:27 -04:00
|
|
|
std::vector<int> visible_devices;
|
|
|
|
|
GetVisibleDevices(visible_devices);
|
2024-04-01 14:51:56 -04:00
|
|
|
|
|
|
|
|
int offset = 0;
|
|
|
|
|
if (gcn_arch_name_base.compare("gfx940") == 0 ||
|
|
|
|
|
gcn_arch_name_base.compare("gfx941") == 0 ||
|
|
|
|
|
gcn_arch_name_base.compare("gfx942") == 0) {
|
|
|
|
|
std::vector<ComputePartition> current_compute_partitions;
|
|
|
|
|
GetCurrentComputePartition(current_compute_partitions);
|
|
|
|
|
if (current_compute_partitions.empty()) {
|
|
|
|
|
//if the current_compute_partitions is empty then the default SPX mode is assumed.
|
2024-04-09 20:28:57 -04:00
|
|
|
if (device_id_ < visible_devices.size()) {
|
|
|
|
|
offset = visible_devices[device_id_] * 7;
|
|
|
|
|
} else {
|
|
|
|
|
offset = device_id_ * 7;
|
|
|
|
|
}
|
2024-04-01 14:51:56 -04:00
|
|
|
} else {
|
2024-04-09 20:28:57 -04:00
|
|
|
GetDrmNodeOffset(device_name, device_id_, visible_devices, current_compute_partitions, offset);
|
2024-04-01 14:51:56 -04:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string drm_node = "/dev/dri/renderD";
|
2024-03-27 14:14:27 -04:00
|
|
|
if (device_id_ < visible_devices.size()) {
|
2024-04-09 20:28:57 -04:00
|
|
|
drm_node += std::to_string(128 + offset + visible_devices[device_id_]);
|
2024-03-27 14:14:27 -04:00
|
|
|
} else {
|
2024-04-09 20:28:57 -04:00
|
|
|
drm_node += std::to_string(128 + offset + device_id_);
|
2024-03-27 14:14:27 -04:00
|
|
|
}
|
2024-03-25 17:05:31 -04:00
|
|
|
CHECK_ROCJPEG(InitVAAPI(drm_node));
|
|
|
|
|
CHECK_ROCJPEG(CreateDecoderConfig());
|
2024-10-30 11:48:47 -04:00
|
|
|
CHECK_ROCJPEG(CreateDecoderContext());
|
2024-03-25 17:05:31 -04:00
|
|
|
|
2024-04-22 14:37:45 -04:00
|
|
|
vaapi_mem_pool_->SetVaapiDisplay(va_display_);
|
2024-07-24 12:36:54 -04:00
|
|
|
|
|
|
|
|
auto it = vcn_jpeg_spec_.find(gcn_arch_name_base_temp);
|
|
|
|
|
if (it != vcn_jpeg_spec_.end()) {
|
|
|
|
|
current_vcn_jpeg_spec_ = it->second;
|
|
|
|
|
} else {
|
|
|
|
|
INFO("WARNING: didn't find the vcn jpeg spec for " + gcn_arch_name_base_temp + " using the default setting");
|
|
|
|
|
current_vcn_jpeg_spec_.num_jpeg_cores = 1;
|
|
|
|
|
}
|
2024-08-14 16:45:05 -04:00
|
|
|
vaapi_mem_pool_->SetPoolSize(current_vcn_jpeg_spec_.num_jpeg_cores + 1);
|
2024-04-22 14:37:45 -04:00
|
|
|
|
2024-03-25 17:05:31 -04:00
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Initializes the VAAPI decoder.
|
|
|
|
|
*
|
|
|
|
|
* This function initializes the VAAPI decoder by opening the DRM node, creating the va_display,
|
|
|
|
|
* setting the info callback, and initializing the va_display.
|
|
|
|
|
*
|
|
|
|
|
* @param drm_node The path to the DRM node.
|
|
|
|
|
* @return The status of the initialization process.
|
|
|
|
|
* - ROCJPEG_STATUS_SUCCESS if the initialization is successful.
|
|
|
|
|
* - ROCJPEG_STATUS_NOT_INITIALIZED if the initialization fails.
|
|
|
|
|
*/
|
2024-03-25 17:05:31 -04:00
|
|
|
RocJpegStatus RocJpegVappiDecoder::InitVAAPI(std::string drm_node) {
|
|
|
|
|
drm_fd_ = open(drm_node.c_str(), O_RDWR);
|
|
|
|
|
if (drm_fd_ < 0) {
|
|
|
|
|
ERR("ERROR: failed to open drm node " + drm_node);
|
|
|
|
|
return ROCJPEG_STATUS_NOT_INITIALIZED;
|
|
|
|
|
}
|
|
|
|
|
va_display_ = vaGetDisplayDRM(drm_fd_);
|
|
|
|
|
if (!va_display_) {
|
|
|
|
|
ERR("ERROR: failed to create va_display!");
|
|
|
|
|
return ROCJPEG_STATUS_NOT_INITIALIZED;
|
|
|
|
|
}
|
|
|
|
|
vaSetInfoCallback(va_display_, NULL, NULL);
|
|
|
|
|
int major_version = 0, minor_version = 0;
|
|
|
|
|
CHECK_VAAPI(vaInitialize(va_display_, &major_version, &minor_version))
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Creates the decoder configuration for the RocJpegVappiDecoder.
|
|
|
|
|
*
|
|
|
|
|
* This function creates the decoder configuration by querying the VA API for supported entrypoints
|
|
|
|
|
* and checking if the hardware JPEG decoder is supported. If the hardware JPEG decoder is supported,
|
|
|
|
|
* it retrieves the maximum picture width and height attributes from the VA API and creates the configuration.
|
|
|
|
|
*
|
|
|
|
|
* @return The status of the decoder configuration creation.
|
|
|
|
|
* - ROCJPEG_STATUS_SUCCESS if the configuration is created successfully.
|
|
|
|
|
* - ROCJPEG_STATUS_HW_JPEG_DECODER_NOT_SUPPORTED if the hardware JPEG decoder is not supported.
|
|
|
|
|
*/
|
2024-03-25 17:05:31 -04:00
|
|
|
RocJpegStatus RocJpegVappiDecoder::CreateDecoderConfig() {
|
|
|
|
|
int max_num_entrypoints = vaMaxNumEntrypoints(va_display_);
|
|
|
|
|
std::vector<VAEntrypoint> jpeg_entrypoint_list;
|
|
|
|
|
jpeg_entrypoint_list.resize(max_num_entrypoints);
|
|
|
|
|
int num_entrypoints = 0;
|
|
|
|
|
CHECK_VAAPI(vaQueryConfigEntrypoints(va_display_, va_profile_, jpeg_entrypoint_list.data(), &num_entrypoints));
|
|
|
|
|
bool hw_jpeg_decoder_supported = false;
|
|
|
|
|
if (num_entrypoints > 0) {
|
|
|
|
|
for (auto entry_point : jpeg_entrypoint_list) {
|
|
|
|
|
if (entry_point == VAEntrypointVLD) {
|
|
|
|
|
hw_jpeg_decoder_supported = true;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
return ROCJPEG_STATUS_HW_JPEG_DECODER_NOT_SUPPORTED;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (hw_jpeg_decoder_supported) {
|
|
|
|
|
va_config_attrib_.resize(3);
|
|
|
|
|
va_config_attrib_[0].type = VAConfigAttribRTFormat;
|
|
|
|
|
va_config_attrib_[1].type = VAConfigAttribMaxPictureWidth;
|
|
|
|
|
va_config_attrib_[2].type = VAConfigAttribMaxPictureHeight;
|
|
|
|
|
CHECK_VAAPI(vaGetConfigAttributes(va_display_, va_profile_, VAEntrypointVLD, va_config_attrib_.data(), va_config_attrib_.size()));
|
|
|
|
|
CHECK_VAAPI(vaCreateConfig(va_display_, va_profile_, VAEntrypointVLD, &va_config_attrib_[0], 1, &va_config_id_));
|
|
|
|
|
if (va_config_attrib_[1].value != VA_ATTRIB_NOT_SUPPORTED) {
|
|
|
|
|
max_picture_width_ = va_config_attrib_[1].value;
|
|
|
|
|
}
|
|
|
|
|
if (va_config_attrib_[2].value != VA_ATTRIB_NOT_SUPPORTED) {
|
|
|
|
|
max_picture_height_ = va_config_attrib_[2].value;
|
|
|
|
|
}
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
} else {
|
|
|
|
|
return ROCJPEG_STATUS_HW_JPEG_DECODER_NOT_SUPPORTED;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2024-10-30 11:48:47 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Creates the decoder context for the VAAPI-based JPEG decoder.
|
|
|
|
|
*
|
|
|
|
|
* This function initializes the VAAPI decoder context.
|
|
|
|
|
*
|
|
|
|
|
* @return RocJpegStatus indicating the success or failure of the context creation.
|
|
|
|
|
*/
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::CreateDecoderContext() {
|
|
|
|
|
|
|
|
|
|
uint32_t surface_format;
|
|
|
|
|
surface_format = VA_RT_FORMAT_YUV420;
|
|
|
|
|
|
|
|
|
|
VASurfaceAttrib surface_attrib;
|
|
|
|
|
surface_attrib.type = VASurfaceAttribPixelFormat;
|
|
|
|
|
surface_attrib.flags = VA_SURFACE_ATTRIB_SETTABLE;
|
|
|
|
|
surface_attrib.value.type = VAGenericValueTypeInteger;
|
|
|
|
|
surface_attrib.value.value.i = VA_FOURCC_NV12;
|
|
|
|
|
|
|
|
|
|
// Create a dummy surface with a resolution of min_picture_width_ x min_picture_height_ supported by the hardware.
|
|
|
|
|
// This surface is only used to create the context for the decoding pipeline, as context creation requires an initial surface.
|
|
|
|
|
// During the actual submission, the appropriate surfaces with the correct resolution will be created.
|
|
|
|
|
CHECK_VAAPI(vaCreateSurfaces(va_display_, surface_format, min_picture_width_, min_picture_height_, &va_surface_id_, 1, &surface_attrib, 1));
|
|
|
|
|
CHECK_VAAPI(vaCreateContext(va_display_, va_config_id_, min_picture_width_, min_picture_height_, VA_PROGRESSIVE, &va_surface_id_, 1, &va_context_id_));
|
|
|
|
|
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Destroys the data buffers used by the RocJpegVappiDecoder.
|
|
|
|
|
*
|
|
|
|
|
* This function destroys the data buffers used by the RocJpegVappiDecoder, including the picture parameter buffer,
|
|
|
|
|
* quantization matrix buffer, Huffman table buffer, slice parameter buffer, and slice data buffer.
|
|
|
|
|
*
|
|
|
|
|
* @return The status of the operation. Returns ROCJPEG_STATUS_SUCCESS if the data buffers were successfully destroyed.
|
|
|
|
|
*/
|
2024-03-25 17:05:31 -04:00
|
|
|
RocJpegStatus RocJpegVappiDecoder::DestroyDataBuffers() {
|
|
|
|
|
if (va_picture_parameter_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_picture_parameter_buf_id_));
|
|
|
|
|
va_picture_parameter_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
if (va_quantization_matrix_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_quantization_matrix_buf_id_));
|
|
|
|
|
va_quantization_matrix_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
if (va_huffmantable_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_huffmantable_buf_id_));
|
|
|
|
|
va_huffmantable_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
if (va_slice_param_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_slice_param_buf_id_));
|
|
|
|
|
va_slice_param_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
if (va_slice_data_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_slice_data_buf_id_));
|
|
|
|
|
va_slice_data_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Submits a JPEG decode operation to the VAAPI decoder.
|
|
|
|
|
*
|
|
|
|
|
* This function submits a JPEG decode operation to the VAAPI decoder using the provided JPEG stream parameters.
|
|
|
|
|
* It checks for invalid parameters and unsupported image resolutions before proceeding with the decode operation.
|
|
|
|
|
* The output format is determined based on the requested format and the capabilities of the hardware decoder.
|
|
|
|
|
*
|
|
|
|
|
* @param jpeg_stream_params The JPEG stream parameters for the decode operation.
|
|
|
|
|
* @param surface_id [out] The ID of the output surface where the decoded image will be stored.
|
2024-07-12 15:20:38 -04:00
|
|
|
* @param decode_params Additional parameters for the decode operation.
|
2024-05-15 13:44:51 -04:00
|
|
|
* @return The status of the decode operation.
|
|
|
|
|
* - ROCJPEG_STATUS_SUCCESS if the decode operation was successful.
|
|
|
|
|
* - ROCJPEG_STATUS_INVALID_PARAMETER if the provided parameters are invalid.
|
|
|
|
|
* - ROCJPEG_STATUS_JPEG_NOT_SUPPORTED if the JPEG image resolution or chroma subsampling is not supported.
|
|
|
|
|
*/
|
2024-07-12 15:20:38 -04:00
|
|
|
RocJpegStatus RocJpegVappiDecoder::SubmitDecode(const JpegStreamParameters *jpeg_stream_params, uint32_t &surface_id, const RocJpegDecodeParams *decode_params) {
    // Both the parsed stream description and the decode options are mandatory.
    if (jpeg_stream_params == nullptr || decode_params == nullptr) {
        return ROCJPEG_STATUS_INVALID_PARAMETER;
    }

    // The parameter blocks are passed to vaCreateBuffer() as raw memory sized by the VA-API
    // structures below, so their sizes have to agree with those structures.
    const bool picture_params_match = sizeof(jpeg_stream_params->picture_parameter_buffer) == sizeof(VAPictureParameterBufferJPEGBaseline);
    const bool quantization_match = sizeof(jpeg_stream_params->quantization_matrix_buffer) == sizeof(VAIQMatrixBufferJPEGBaseline);
    const bool huffman_match = sizeof(jpeg_stream_params->huffman_table_buffer) == sizeof(VAHuffmanTableBufferJPEGBaseline);
    const bool slice_params_match = sizeof(jpeg_stream_params->slice_parameter_buffer) == sizeof(VASliceParameterBufferJPEGBaseline);
    if (!(picture_params_match && quantization_match && huffman_match && slice_params_match)) {
        return ROCJPEG_STATUS_INVALID_PARAMETER;
    }

    // Reject images outside the resolution range stored in the min/max picture size members.
    const auto image_width = jpeg_stream_params->picture_parameter_buffer.picture_width;
    const auto image_height = jpeg_stream_params->picture_parameter_buffer.picture_height;
    const bool below_minimum = image_width < min_picture_width_ || image_height < min_picture_height_;
    const bool above_maximum = image_width > max_picture_width_ || image_height > max_picture_height_;
    if (below_minimum || above_maximum) {
        ERR("The JPEG image resolution is not supported!");
        return ROCJPEG_STATUS_JPEG_NOT_SUPPORTED;
    }

    uint32_t surface_format;
    VASurfaceAttrib surface_attrib;
    surface_attrib.type = VASurfaceAttribPixelFormat;
    surface_attrib.flags = VA_SURFACE_ATTRIB_SETTABLE;
    surface_attrib.value.type = VAGenericValueTypeInteger;

    // When an RGB output is requested and the HW JPEG decoder can convert to RGB itself, pick an RGB
    // surface so the decoder produces the RGB output directly. CSS_440 streams are excluded from this
    // path. In every other case the surface follows the chroma subsampling of the image.
    const bool rgb_requested = decode_params->output_format == ROCJPEG_OUTPUT_RGB ||
                               decode_params->output_format == ROCJPEG_OUTPUT_RGB_PLANAR;
    const bool decode_to_rgb = rgb_requested && current_vcn_jpeg_spec_.can_convert_to_rgb &&
                               jpeg_stream_params->chroma_subsampling != CSS_440;
    if (decode_to_rgb) {
        if (decode_params->output_format == ROCJPEG_OUTPUT_RGB) {
            surface_format = VA_RT_FORMAT_RGB32;
            surface_attrib.value.value.i = VA_FOURCC_RGBA;
        } else {
            // rgb_requested leaves ROCJPEG_OUTPUT_RGB_PLANAR as the only other possibility.
            surface_format = VA_RT_FORMAT_RGBP;
            surface_attrib.value.value.i = VA_FOURCC_RGBP;
        }
    } else {
        switch (jpeg_stream_params->chroma_subsampling) {
            case CSS_444:
                surface_format = VA_RT_FORMAT_YUV444;
                surface_attrib.value.value.i = VA_FOURCC_444P;
                break;
            case CSS_440:
                surface_format = VA_RT_FORMAT_YUV422;
                surface_attrib.value.value.i = VA_FOURCC_422V;
                break;
            case CSS_422:
                surface_format = VA_RT_FORMAT_YUV422;
                surface_attrib.value.value.i = ROCJPEG_FOURCC_YUYV;
                break;
            case CSS_420:
                surface_format = VA_RT_FORMAT_YUV420;
                surface_attrib.value.value.i = VA_FOURCC_NV12;
                break;
            case CSS_400:
                surface_format = VA_RT_FORMAT_YUV400;
                surface_attrib.value.value.i = VA_FOURCC_Y800;
                break;
            default:
                ERR("ERROR: The chroma subsampling is not supported by the VCN hardware!");
                return ROCJPEG_STATUS_JPEG_NOT_SUPPORTED;
        }
    }

    // If the HW JPEG decoder supports ROI decode, store the requested crop rectangle in the picture
    // parameter buffer. The rectangle is only applied when it is non-empty and no larger than the image.
    // NOTE(review): this writes into the caller's stream parameters through a pointer-to-const, and the
    // stored rectangle is not cleared when a later call requests no ROI - confirm this is intended.
    void *picture_parameter_buffer = const_cast<void *>(static_cast<const void *>(&jpeg_stream_params->picture_parameter_buffer));
    if (current_vcn_jpeg_spec_.can_roi_decode) {
        const uint32_t roi_width = decode_params->crop_rectangle.right - decode_params->crop_rectangle.left;
        const uint32_t roi_height = decode_params->crop_rectangle.bottom - decode_params->crop_rectangle.top;
        const bool roi_usable = roi_width > 0 && roi_height > 0 && roi_width <= image_width && roi_height <= image_height;
        if (roi_usable) {
            VAPictureParameterBufferJPEGBaseline *va_picture_params = reinterpret_cast<VAPictureParameterBufferJPEGBaseline*>(picture_parameter_buffer);
#if VA_CHECK_VERSION(1, 21, 0)
            va_picture_params->crop_rectangle.x = decode_params->crop_rectangle.left;
            va_picture_params->crop_rectangle.y = decode_params->crop_rectangle.top;
            va_picture_params->crop_rectangle.width = roi_width;
            va_picture_params->crop_rectangle.height = roi_height;
#else
            // Without the crop_rectangle field the rectangle is packed into the reserved words:
            // [0] = top << 16 | left, [1] = height << 16 | width.
            va_picture_params->va_reserved[0] = decode_params->crop_rectangle.top << 16 | decode_params->crop_rectangle.left;
            va_picture_params->va_reserved[1] = roi_height << 16 | roi_width;
#endif
        }
    }

    // Ask the memory pool for an entry matching this pixel format and size. An entry with no
    // surfaces means a new surface has to be created and registered with the pool.
    uint32_t surface_pixel_format = static_cast<uint32_t>(surface_attrib.value.value.i);
    RocJpegVaapiMemPoolEntry mem_pool_entry = vaapi_mem_pool_->GetEntry(surface_pixel_format, image_width, image_height, 1);
    if (!mem_pool_entry.va_surface_ids.empty()) {
        surface_id = mem_pool_entry.va_surface_ids[0];
    } else {
        mem_pool_entry.va_surface_ids.resize(1);
        CHECK_VAAPI(vaCreateSurfaces(va_display_, surface_format, jpeg_stream_params->picture_parameter_buffer.picture_width, jpeg_stream_params->picture_parameter_buffer.picture_height, mem_pool_entry.va_surface_ids.data(), 1, &surface_attrib, 1));
        mem_pool_entry.image_width = image_width;
        mem_pool_entry.image_height = image_height;
        mem_pool_entry.hip_interops.resize(1);
        surface_id = mem_pool_entry.va_surface_ids[0];
        mem_pool_entry.entry_status = kBusy;
        CHECK_ROCJPEG(vaapi_mem_pool_->AddPoolEntry(surface_pixel_format, mem_pool_entry));
    }

    // Release the data buffers of the previous submission before creating the new set.
    CHECK_ROCJPEG(DestroyDataBuffers());

    CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAPictureParameterBufferType, sizeof(VAPictureParameterBufferJPEGBaseline), 1, picture_parameter_buffer, &va_picture_parameter_buf_id_));
    CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAIQMatrixBufferType, sizeof(VAIQMatrixBufferJPEGBaseline), 1, (void *)&jpeg_stream_params->quantization_matrix_buffer, &va_quantization_matrix_buf_id_));
    CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAHuffmanTableBufferType, sizeof(VAHuffmanTableBufferJPEGBaseline), 1, (void *)&jpeg_stream_params->huffman_table_buffer, &va_huffmantable_buf_id_));
    CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VASliceParameterBufferType, sizeof(VASliceParameterBufferJPEGBaseline), 1, (void *)&jpeg_stream_params->slice_parameter_buffer, &va_slice_param_buf_id_));
    CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VASliceDataBufferType, jpeg_stream_params->slice_parameter_buffer.slice_data_size, 1, (void *)jpeg_stream_params->slice_data_buffer, &va_slice_data_buf_id_));

    // Submit the picture: begin, hand over each buffer in turn, end.
    CHECK_VAAPI(vaBeginPicture(va_display_, va_context_id_, surface_id));
    CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_picture_parameter_buf_id_, 1));
    CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_quantization_matrix_buf_id_, 1));
    CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_huffmantable_buf_id_, 1));
    CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_slice_param_buf_id_, 1));
    CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_slice_data_buf_id_, 1));
    CHECK_VAAPI(vaEndPicture(va_display_, va_context_id_));

    return ROCJPEG_STATUS_SUCCESS;
}
|
|
|
|
|
|
2024-07-12 15:20:38 -04:00
|
|
|
/**
 * @brief Submits a batch of parsed JPEG streams for decoding.
 *
 * The streams are first validated and grouped by surface format, pixel format, width and height.
 * For every group a matching entry is requested from the VAAPI memory pool; when the returned entry
 * has no surfaces, one surface per stream of the group is created and the entry is added to the pool.
 * Each stream of the group is then submitted for decoding on its surface.
 *
 * @param jpeg_streams_params Array of batch_size parsed stream descriptions. The picture parameter
 *                            buffer of a stream is modified when a crop rectangle is applied.
 * @param batch_size Number of entries in jpeg_streams_params and surface_ids.
 * @param decode_params Decode options (output format and crop rectangle) shared by the whole batch.
 * @param surface_ids Output array; entry i receives the surface used for stream i.
 * @return ROCJPEG_STATUS_SUCCESS when every stream was submitted,
 *         ROCJPEG_STATUS_INVALID_PARAMETER for null arguments or mismatching parameter-buffer sizes,
 *         ROCJPEG_STATUS_JPEG_NOT_SUPPORTED for an unsupported resolution or chroma subsampling.
 *         Failures detected by CHECK_VAAPI / CHECK_ROCJPEG are reported by those macros (defined elsewhere).
 */
RocJpegStatus RocJpegVappiDecoder::SubmitDecodeBatched(JpegStreamParameters *jpeg_streams_params, int batch_size, const RocJpegDecodeParams *decode_params, uint32_t *surface_ids) {
    if (jpeg_streams_params == nullptr || decode_params == nullptr || surface_ids == nullptr) {
        return ROCJPEG_STATUS_INVALID_PARAMETER;
    }

    // The output-format part of the RGB decision is the same for every stream of the batch.
    const bool rgb_requested = decode_params->output_format == ROCJPEG_OUTPUT_RGB ||
                               decode_params->output_format == ROCJPEG_OUTPUT_RGB_PLANAR;
    const bool hw_rgb_output = rgb_requested && current_vcn_jpeg_spec_.can_convert_to_rgb;

    // Group the streams by surface format, pixel format, width and height. The map value holds the
    // batch positions of the streams that share a key.
    std::unordered_map<JpegStreamKey, std::vector<int>> jpeg_stream_groups;
    for (int stream_idx = 0; stream_idx < batch_size; ++stream_idx) {
        const JpegStreamParameters &stream = jpeg_streams_params[stream_idx];

        // The parameter blocks are handed to vaCreateBuffer() sized by the VA-API structures.
        const bool sizes_match = sizeof(stream.picture_parameter_buffer) == sizeof(VAPictureParameterBufferJPEGBaseline) &&
                                 sizeof(stream.quantization_matrix_buffer) == sizeof(VAIQMatrixBufferJPEGBaseline) &&
                                 sizeof(stream.huffman_table_buffer) == sizeof(VAHuffmanTableBufferJPEGBaseline) &&
                                 sizeof(stream.slice_parameter_buffer) == sizeof(VASliceParameterBufferJPEGBaseline);
        if (!sizes_match) {
            return ROCJPEG_STATUS_INVALID_PARAMETER;
        }

        JpegStreamKey group_key = {};
        group_key.width = stream.picture_parameter_buffer.picture_width;
        group_key.height = stream.picture_parameter_buffer.picture_height;
        const bool below_minimum = group_key.width < min_picture_width_ || group_key.height < min_picture_height_;
        const bool above_maximum = group_key.width > max_picture_width_ || group_key.height > max_picture_height_;
        if (below_minimum || above_maximum) {
            ERR("The JPEG image resolution is not supported!");
            return ROCJPEG_STATUS_JPEG_NOT_SUPPORTED;
        }

        // CSS_440 streams never take the direct-to-RGB path.
        if (hw_rgb_output && stream.chroma_subsampling != CSS_440) {
            if (decode_params->output_format == ROCJPEG_OUTPUT_RGB) {
                group_key.surface_format = VA_RT_FORMAT_RGB32;
                group_key.pixel_format = VA_FOURCC_RGBA;
            } else {
                // rgb_requested leaves ROCJPEG_OUTPUT_RGB_PLANAR as the only other possibility.
                group_key.surface_format = VA_RT_FORMAT_RGBP;
                group_key.pixel_format = VA_FOURCC_RGBP;
            }
        } else {
            switch (stream.chroma_subsampling) {
                case CSS_444:
                    group_key.surface_format = VA_RT_FORMAT_YUV444;
                    group_key.pixel_format = VA_FOURCC_444P;
                    break;
                case CSS_440:
                    group_key.surface_format = VA_RT_FORMAT_YUV422;
                    group_key.pixel_format = VA_FOURCC_422V;
                    break;
                case CSS_422:
                    group_key.surface_format = VA_RT_FORMAT_YUV422;
                    group_key.pixel_format = ROCJPEG_FOURCC_YUYV;
                    break;
                case CSS_420:
                    group_key.surface_format = VA_RT_FORMAT_YUV420;
                    group_key.pixel_format = VA_FOURCC_NV12;
                    break;
                case CSS_400:
                    group_key.surface_format = VA_RT_FORMAT_YUV400;
                    group_key.pixel_format = VA_FOURCC_Y800;
                    break;
                default:
                    ERR("ERROR: The chroma subsampling is not supported by the VCN hardware!");
                    return ROCJPEG_STATUS_JPEG_NOT_SUPPORTED;
            }
        }
        jpeg_stream_groups[group_key].push_back(stream_idx);
    }

    uint32_t surface_format;
    VASurfaceAttrib surface_attrib;
    surface_attrib.type = VASurfaceAttribPixelFormat;
    surface_attrib.flags = VA_SURFACE_ATTRIB_SETTABLE;
    surface_attrib.value.type = VAGenericValueTypeInteger;

    // The crop rectangle is shared by the whole batch, so its extent is computed once.
    const uint32_t roi_width = decode_params->crop_rectangle.right - decode_params->crop_rectangle.left;
    const uint32_t roi_height = decode_params->crop_rectangle.bottom - decode_params->crop_rectangle.top;
    const bool roi_requested = current_vcn_jpeg_spec_.can_roi_decode && roi_width > 0 && roi_height > 0;

    // For each group: obtain (or create and register) the surfaces, then submit every stream of the group.
    for (const auto &group : jpeg_stream_groups) {
        const JpegStreamKey &key = group.first;
        const std::vector<int> &stream_indices = group.second;

        surface_format = key.surface_format;
        surface_attrib.value.value.i = key.pixel_format;

        RocJpegVaapiMemPoolEntry mem_pool_entry = vaapi_mem_pool_->GetEntry(key.pixel_format, key.width, key.height, stream_indices.size());

        // Copies the entry's surfaces to the caller's array at the batch positions of this group.
        // NOTE(review): assumes the entry never holds more surfaces than the group has streams - confirm against GetEntry().
        const auto publish_surface_ids = [&]() {
            for (size_t slot = 0; slot < mem_pool_entry.va_surface_ids.size(); ++slot) {
                surface_ids[stream_indices[slot]] = mem_pool_entry.va_surface_ids[slot];
            }
        };

        if (!mem_pool_entry.va_surface_ids.empty()) {
            publish_surface_ids();
        } else {
            mem_pool_entry.va_surface_ids.resize(stream_indices.size());
            CHECK_VAAPI(vaCreateSurfaces(va_display_, surface_format, key.width, key.height, mem_pool_entry.va_surface_ids.data(), mem_pool_entry.va_surface_ids.size(), &surface_attrib, 1));
            mem_pool_entry.image_width = key.width;
            mem_pool_entry.image_height = key.height;
            publish_surface_ids();
            mem_pool_entry.hip_interops.resize(stream_indices.size());
            mem_pool_entry.entry_status = kBusy;
            CHECK_ROCJPEG(vaapi_mem_pool_->AddPoolEntry(key.pixel_format, mem_pool_entry));
        }

        for (int idx : stream_indices) {
            // If the HW JPEG decoder supports ROI decode, store the requested crop rectangle in the
            // picture parameter buffer, provided it is non-empty and no larger than this image.
            void* picture_parameter_buffer = &jpeg_streams_params[idx].picture_parameter_buffer;
            const bool roi_usable = roi_requested &&
                                    roi_width <= jpeg_streams_params[idx].picture_parameter_buffer.picture_width &&
                                    roi_height <= jpeg_streams_params[idx].picture_parameter_buffer.picture_height;
            if (roi_usable) {
                VAPictureParameterBufferJPEGBaseline *va_picture_params = reinterpret_cast<VAPictureParameterBufferJPEGBaseline*>(picture_parameter_buffer);
#if VA_CHECK_VERSION(1, 21, 0)
                va_picture_params->crop_rectangle.x = decode_params->crop_rectangle.left;
                va_picture_params->crop_rectangle.y = decode_params->crop_rectangle.top;
                va_picture_params->crop_rectangle.width = roi_width;
                va_picture_params->crop_rectangle.height = roi_height;
#else
                // Without the crop_rectangle field the rectangle is packed into the reserved words:
                // [0] = top << 16 | left, [1] = height << 16 | width.
                va_picture_params->va_reserved[0] = decode_params->crop_rectangle.top << 16 | decode_params->crop_rectangle.left;
                va_picture_params->va_reserved[1] = roi_height << 16 | roi_width;
#endif
            }

            // Release the data buffers of the previous submission before creating the new set.
            CHECK_ROCJPEG(DestroyDataBuffers());
            CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAPictureParameterBufferType, sizeof(VAPictureParameterBufferJPEGBaseline), 1, picture_parameter_buffer, &va_picture_parameter_buf_id_));
            CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAIQMatrixBufferType, sizeof(VAIQMatrixBufferJPEGBaseline), 1, (void *)&jpeg_streams_params[idx].quantization_matrix_buffer, &va_quantization_matrix_buf_id_));
            CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAHuffmanTableBufferType, sizeof(VAHuffmanTableBufferJPEGBaseline), 1, (void *)&jpeg_streams_params[idx].huffman_table_buffer, &va_huffmantable_buf_id_));
            CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VASliceParameterBufferType, sizeof(VASliceParameterBufferJPEGBaseline), 1, (void *)&jpeg_streams_params[idx].slice_parameter_buffer, &va_slice_param_buf_id_));
            CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VASliceDataBufferType, jpeg_streams_params[idx].slice_parameter_buffer.slice_data_size, 1, (void *)jpeg_streams_params[idx].slice_data_buffer, &va_slice_data_buf_id_));

            // Submit the picture: begin, hand over each buffer in turn, end.
            CHECK_VAAPI(vaBeginPicture(va_display_, va_context_id_, surface_ids[idx]));
            CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_picture_parameter_buf_id_, 1));
            CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_quantization_matrix_buf_id_, 1));
            CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_huffmantable_buf_id_, 1));
            CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_slice_param_buf_id_, 1));
            CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_slice_data_buf_id_, 1));
            CHECK_VAAPI(vaEndPicture(va_display_, va_context_id_));
        }
    }

    return ROCJPEG_STATUS_SUCCESS;
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Synchronizes the specified VASurfaceID.
|
|
|
|
|
*
|
|
|
|
|
* This function synchronizes the specified VASurfaceID by querying its status and waiting until it becomes ready.
|
|
|
|
|
* If the surface ID is not found in the VAAPI memory pool, it returns ROCJPEG_STATUS_INVALID_PARAMETER.
|
|
|
|
|
* If any error occurs during synchronization, it returns ROCJPEG_STATUS_RUNTIME_ERROR.
|
|
|
|
|
*
|
|
|
|
|
* @param surface_id The VASurfaceID to synchronize.
|
|
|
|
|
* @return The status of the synchronization operation.
|
|
|
|
|
*/
|
2024-03-25 17:05:31 -04:00
|
|
|
RocJpegStatus RocJpegVappiDecoder::SyncSurface(VASurfaceID surface_id) {
|
|
|
|
|
VASurfaceStatus surface_status;
|
2024-04-22 14:37:45 -04:00
|
|
|
if (!vaapi_mem_pool_->FindSurfaceId(surface_id)) {
|
2024-03-25 17:05:31 -04:00
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
CHECK_VAAPI(vaQuerySurfaceStatus(va_display_, surface_id, &surface_status));
|
|
|
|
|
while (surface_status != VASurfaceReady) {
|
|
|
|
|
VAStatus va_status = vaSyncSurface(va_display_, surface_id);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
if (va_status == 0x26 /*VA_STATUS_ERROR_TIMEDOUT*/) {
|
|
|
|
|
CHECK_VAAPI(vaQuerySurfaceStatus(va_display_, surface_id, &surface_status));
|
|
|
|
|
} else {
|
|
|
|
|
std::cout << "vaSyncSurface() failed with error code: 0x" << std::hex << va_status <<
|
|
|
|
|
std::dec << "', status: " << vaErrorStr(va_status) << "' at " << __FILE__ << ":" << __LINE__ << std::endl;
|
|
|
|
|
return ROCJPEG_STATUS_RUNTIME_ERROR;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Retrieves the HipInteropDeviceMem associated with the specified VASurfaceID.
|
|
|
|
|
*
|
|
|
|
|
* This function retrieves the HipInteropDeviceMem associated with the specified VASurfaceID
|
|
|
|
|
* from the vaapi_mem_pool_ and stores it in the provided `hip_interop` parameter.
|
|
|
|
|
*
|
|
|
|
|
* @param surface_id The VASurfaceID of the surface to retrieve the HipInteropDeviceMem for.
|
|
|
|
|
* @param hip_interop The reference to a HipInteropDeviceMem object where the retrieved memory will be stored.
|
|
|
|
|
* @return The RocJpegStatus indicating the success or failure of the operation.
|
|
|
|
|
*/
|
2024-04-22 14:37:45 -04:00
|
|
|
RocJpegStatus RocJpegVappiDecoder::GetHipInteropMem(VASurfaceID surface_id, HipInteropDeviceMem& hip_interop) {
|
|
|
|
|
return vaapi_mem_pool_->GetHipInteropMem(surface_id, hip_interop);
|
2024-03-27 14:14:27 -04:00
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Retrieves the visible devices for the RocJpegVappiDecoder.
|
|
|
|
|
*
|
|
|
|
|
* This function retrieves the visible devices for the RocJpegVappiDecoder by reading the value of the environment variable "HIP_VISIBLE_DEVICES".
|
|
|
|
|
* The visible devices are stored in the provided vector `visible_devices_vector`.
|
|
|
|
|
*
|
|
|
|
|
* @param visible_devices_vector The vector to store the visible devices.
|
|
|
|
|
*/
|
2024-03-27 14:14:27 -04:00
|
|
|
void RocJpegVappiDecoder::GetVisibleDevices(std::vector<int>& visible_devices_vetor) {
|
|
|
|
|
char *visible_devices = std::getenv("HIP_VISIBLE_DEVICES");
|
|
|
|
|
if (visible_devices != nullptr) {
|
|
|
|
|
char *token = std::strtok(visible_devices,",");
|
|
|
|
|
while (token != nullptr) {
|
|
|
|
|
visible_devices_vetor.push_back(std::atoi(token));
|
|
|
|
|
token = std::strtok(nullptr,",");
|
|
|
|
|
}
|
|
|
|
|
std::sort(visible_devices_vetor.begin(), visible_devices_vetor.end());
|
|
|
|
|
}
|
2024-04-01 14:51:56 -04:00
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* Retrieves the current compute partitions from the system.
|
|
|
|
|
*
|
|
|
|
|
* This function searches for the "current_compute_partition" file in the "/sys/devices/" directory
|
|
|
|
|
* and reads the partition value from each file found. The partition value is then compared to known
|
|
|
|
|
* partition names and the corresponding ComputePartition enum value is added to the provided vector.
|
|
|
|
|
*
|
|
|
|
|
* @param current_compute_partitions A vector to store the current compute partitions.
|
|
|
|
|
*/
|
2024-04-01 14:51:56 -04:00
|
|
|
void RocJpegVappiDecoder::GetCurrentComputePartition(std::vector<ComputePartition> ¤t_compute_partitions) {
|
|
|
|
|
std::string search_path = "/sys/devices/";
|
|
|
|
|
std::string partition_file = "current_compute_partition";
|
2024-05-30 09:08:35 -04:00
|
|
|
std::error_code ec;
|
|
|
|
|
if (fs::exists(search_path)) {
|
|
|
|
|
for (auto it = fs::recursive_directory_iterator(search_path, fs::directory_options::skip_permission_denied); it != fs::recursive_directory_iterator(); ) {
|
|
|
|
|
try {
|
|
|
|
|
if (it->path().filename() == partition_file) {
|
|
|
|
|
std::ifstream file(it->path());
|
|
|
|
|
if (file.is_open()) {
|
|
|
|
|
std::string partition;
|
|
|
|
|
std::getline(file, partition);
|
|
|
|
|
if (partition.compare("SPX") == 0 || partition.compare("spx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kSpx);
|
|
|
|
|
} else if (partition.compare("DPX") == 0 || partition.compare("dpx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kDpx);
|
|
|
|
|
} else if (partition.compare("TPX") == 0 || partition.compare("tpx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kTpx);
|
|
|
|
|
} else if (partition.compare("QPX") == 0 || partition.compare("qpx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kQpx);
|
|
|
|
|
} else if (partition.compare("CPX") == 0 || partition.compare("cpx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kCpx);
|
|
|
|
|
}
|
|
|
|
|
file.close();
|
|
|
|
|
}
|
2024-04-01 14:51:56 -04:00
|
|
|
}
|
2024-05-30 09:08:35 -04:00
|
|
|
++it;
|
|
|
|
|
} catch (fs::filesystem_error& e) {
|
|
|
|
|
it.increment(ec);
|
2024-04-01 14:51:56 -04:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2024-05-15 13:44:51 -04:00
|
|
|
/**
|
|
|
|
|
* @brief Calculates the offset for the DRM node based on the device name, device ID, visible devices,
|
|
|
|
|
* current compute partitions, and the selected compute partition.
|
|
|
|
|
*
|
|
|
|
|
* @param device_name The name of the device.
|
|
|
|
|
* @param device_id The ID of the device.
|
|
|
|
|
* @param visible_devices A vector containing the IDs of the visible devices.
|
|
|
|
|
* @param current_compute_partitions A vector containing the current compute partitions.
|
|
|
|
|
* @param offset The calculated offset for the DRM node.
|
|
|
|
|
*/
|
2024-04-09 20:28:57 -04:00
|
|
|
void RocJpegVappiDecoder::GetDrmNodeOffset(std::string device_name, uint8_t device_id, std::vector<int>& visible_devices,
|
2024-04-01 14:51:56 -04:00
|
|
|
std::vector<ComputePartition> ¤t_compute_partitions,
|
2024-04-09 20:28:57 -04:00
|
|
|
int &offset) {
|
2024-04-01 14:51:56 -04:00
|
|
|
if (!current_compute_partitions.empty()) {
|
|
|
|
|
switch (current_compute_partitions[0]) {
|
|
|
|
|
case kSpx:
|
2024-04-09 20:28:57 -04:00
|
|
|
if (device_id < visible_devices.size()) {
|
|
|
|
|
offset = visible_devices[device_id] * 7;
|
|
|
|
|
} else {
|
|
|
|
|
offset = device_id * 7;
|
|
|
|
|
}
|
2024-04-01 14:51:56 -04:00
|
|
|
break;
|
|
|
|
|
case kDpx:
|
2024-04-09 20:28:57 -04:00
|
|
|
if (device_id < visible_devices.size()) {
|
|
|
|
|
offset = (visible_devices[device_id] / 2) * 6;
|
|
|
|
|
} else {
|
|
|
|
|
offset = (device_id / 2) * 6;
|
|
|
|
|
}
|
2024-04-01 14:51:56 -04:00
|
|
|
break;
|
|
|
|
|
case kTpx:
|
|
|
|
|
// Please note that although there are only 6 XCCs per socket on MI300A,
|
|
|
|
|
// there are two dummy render nodes added by the driver.
|
|
|
|
|
// This needs to be taken into account when creating drm_node on each socket in TPX mode.
|
|
|
|
|
if (device_id < visible_devices.size()) {
|
2024-04-09 20:28:57 -04:00
|
|
|
offset = (visible_devices[device_id] / 3) * 5;
|
2024-04-01 14:51:56 -04:00
|
|
|
} else {
|
2024-04-09 20:28:57 -04:00
|
|
|
offset = (device_id / 3) * 5;
|
2024-04-01 14:51:56 -04:00
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case kQpx:
|
2024-04-09 20:28:57 -04:00
|
|
|
if (device_id < visible_devices.size()) {
|
|
|
|
|
offset = (visible_devices[device_id] / 4) * 4;
|
|
|
|
|
} else {
|
|
|
|
|
offset = (device_id / 4) * 4;
|
|
|
|
|
}
|
2024-04-01 14:51:56 -04:00
|
|
|
break;
|
|
|
|
|
case kCpx:
|
|
|
|
|
// Please note that both MI300A and MI300X have the same gfx_arch_name which is
|
|
|
|
|
// gfx942. Therefore we cannot use the gfx942 to identify MI300A.
|
|
|
|
|
// instead use the device name and look for MI300A
|
|
|
|
|
// Also, as explained aboe in the TPX mode section, we need to be taken into account
|
|
|
|
|
// the extra two dummy nodes when creating drm_node on each socket in CPX mode as well.
|
|
|
|
|
std::string mi300a = "MI300A";
|
|
|
|
|
size_t found_mi300a = device_name.find(mi300a);
|
|
|
|
|
if (found_mi300a != std::string::npos) {
|
2024-04-09 20:28:57 -04:00
|
|
|
if (device_id < visible_devices.size()) {
|
|
|
|
|
offset = (visible_devices[device_id] / 6) * 2;
|
|
|
|
|
} else {
|
|
|
|
|
offset = (device_id / 6) * 2;
|
|
|
|
|
}
|
2024-04-01 14:51:56 -04:00
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
2024-08-14 16:45:05 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* @brief Sets a VASurfaceID as idle.
|
|
|
|
|
*
|
|
|
|
|
* This function sets the specified VASurfaceID as idle in the RocJpegVappiDecoder's vaapi_mem_pool.
|
|
|
|
|
* If the surface cannot be set as idle, it returns ROCJPEG_STATUS_INVALID_PARAMETER.
|
|
|
|
|
*
|
|
|
|
|
* @param surface_id The VASurfaceID to set as idle.
|
|
|
|
|
* @return RocJpegStatus The status of the operation. Returns ROCJPEG_STATUS_SUCCESS if successful,
|
|
|
|
|
* or ROCJPEG_STATUS_INVALID_PARAMETER if the surface cannot be set as idle.
|
|
|
|
|
*/
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::SetSurfaceAsIdle(VASurfaceID surface_id) {
|
|
|
|
|
if (!vaapi_mem_pool_->SetSurfaceAsIdle(surface_id)) {
|
|
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
|
|
|
|
}
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
2024-03-25 17:05:31 -04:00
|
|
|
}
|