2024-03-25 17:05:31 -04:00
|
|
|
/*
|
|
|
|
|
Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
|
|
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
|
|
|
in the Software without restriction, including without limitation the rights
|
|
|
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
|
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
|
|
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
|
|
|
all copies or substantial portions of the Software.
|
|
|
|
|
|
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
|
THE SOFTWARE.
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
#include "rocjpeg_vaapi_decoder.h"
|
|
|
|
|
|
|
|
|
|
RocJpegVappiDecoder::RocJpegVappiDecoder(int device_id) : device_id_{device_id}, drm_fd_{-1}, min_picture_width_{64}, min_picture_height_{64},
|
|
|
|
|
max_picture_width_{4096}, max_picture_height_{4096}, va_display_{0}, va_config_attrib_{{}}, va_config_id_{0}, va_profile_{VAProfileJPEGBaseline},
|
|
|
|
|
va_context_id_{0}, va_surface_ids_{}, va_picture_parameter_buf_id_{0}, va_quantization_matrix_buf_id_{0}, va_huffmantable_buf_id_{0},
|
|
|
|
|
va_slice_param_buf_id_{0}, va_slice_data_buf_id_{0} {};
|
|
|
|
|
|
|
|
|
|
RocJpegVappiDecoder::~RocJpegVappiDecoder() {
|
|
|
|
|
if (drm_fd_ != -1) {
|
|
|
|
|
close(drm_fd_);
|
|
|
|
|
}
|
|
|
|
|
if (va_display_) {
|
|
|
|
|
RocJpegStatus rocjpeg_status = DestroyDataBuffers();
|
|
|
|
|
if (rocjpeg_status != ROCJPEG_STATUS_SUCCESS) {
|
|
|
|
|
ERR("Error: Failed to destroy VAAPI buffer");
|
|
|
|
|
}
|
|
|
|
|
VAStatus va_status;
|
|
|
|
|
if (va_surface_ids_.size() > 0) {
|
|
|
|
|
va_status = vaDestroySurfaces(va_display_, va_surface_ids_.data(), va_surface_ids_.size());
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaDestroySurfaces failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (va_context_id_) {
|
|
|
|
|
va_status = vaDestroyContext(va_display_, va_context_id_);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaDestroyContext failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (va_config_id_) {
|
|
|
|
|
va_status = vaDestroyConfig(va_display_, va_config_id_);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaDestroyConfig failed!");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
va_status = vaTerminate(va_display_);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
ERR("ERROR: vaTerminate failed!");
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2024-04-01 14:51:56 -04:00
|
|
|
RocJpegStatus RocJpegVappiDecoder::InitializeDecoder(std::string device_name, std::string gcn_arch_name) {
|
2024-03-27 14:14:27 -04:00
|
|
|
std::size_t pos = gcn_arch_name.find_first_of(":");
|
|
|
|
|
std::string gcn_arch_name_base = (pos != std::string::npos) ? gcn_arch_name.substr(0, pos) : gcn_arch_name;
|
|
|
|
|
|
|
|
|
|
std::vector<int> visible_devices;
|
|
|
|
|
GetVisibleDevices(visible_devices);
|
2024-04-01 14:51:56 -04:00
|
|
|
|
|
|
|
|
int num_render_cards_per_socket = 1;
|
|
|
|
|
int offset = 0;
|
|
|
|
|
if (gcn_arch_name_base.compare("gfx940") == 0 ||
|
|
|
|
|
gcn_arch_name_base.compare("gfx941") == 0 ||
|
|
|
|
|
gcn_arch_name_base.compare("gfx942") == 0) {
|
|
|
|
|
std::vector<ComputePartition> current_compute_partitions;
|
|
|
|
|
GetCurrentComputePartition(current_compute_partitions);
|
|
|
|
|
if (current_compute_partitions.empty()) {
|
|
|
|
|
//if the current_compute_partitions is empty then the default SPX mode is assumed.
|
|
|
|
|
num_render_cards_per_socket = 8;
|
|
|
|
|
} else {
|
|
|
|
|
GetNumRenderCardsPerDevice(device_name, device_id_, visible_devices, current_compute_partitions, num_render_cards_per_socket, offset);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string drm_node = "/dev/dri/renderD";
|
2024-03-27 14:14:27 -04:00
|
|
|
if (device_id_ < visible_devices.size()) {
|
2024-04-01 14:51:56 -04:00
|
|
|
drm_node += std::to_string(128 + offset + visible_devices[device_id_] * num_render_cards_per_socket);
|
2024-03-27 14:14:27 -04:00
|
|
|
} else {
|
2024-04-01 14:51:56 -04:00
|
|
|
drm_node += std::to_string(128 + offset + device_id_ * num_render_cards_per_socket);
|
2024-03-27 14:14:27 -04:00
|
|
|
}
|
2024-03-25 17:05:31 -04:00
|
|
|
CHECK_ROCJPEG(InitVAAPI(drm_node));
|
|
|
|
|
CHECK_ROCJPEG(CreateDecoderConfig());
|
|
|
|
|
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::InitVAAPI(std::string drm_node) {
|
|
|
|
|
drm_fd_ = open(drm_node.c_str(), O_RDWR);
|
|
|
|
|
if (drm_fd_ < 0) {
|
|
|
|
|
ERR("ERROR: failed to open drm node " + drm_node);
|
|
|
|
|
return ROCJPEG_STATUS_NOT_INITIALIZED;
|
|
|
|
|
}
|
|
|
|
|
va_display_ = vaGetDisplayDRM(drm_fd_);
|
|
|
|
|
if (!va_display_) {
|
|
|
|
|
ERR("ERROR: failed to create va_display!");
|
|
|
|
|
return ROCJPEG_STATUS_NOT_INITIALIZED;
|
|
|
|
|
}
|
|
|
|
|
vaSetInfoCallback(va_display_, NULL, NULL);
|
|
|
|
|
int major_version = 0, minor_version = 0;
|
|
|
|
|
CHECK_VAAPI(vaInitialize(va_display_, &major_version, &minor_version))
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::CreateDecoderConfig() {
|
|
|
|
|
int max_num_entrypoints = vaMaxNumEntrypoints(va_display_);
|
|
|
|
|
std::vector<VAEntrypoint> jpeg_entrypoint_list;
|
|
|
|
|
jpeg_entrypoint_list.resize(max_num_entrypoints);
|
|
|
|
|
int num_entrypoints = 0;
|
|
|
|
|
CHECK_VAAPI(vaQueryConfigEntrypoints(va_display_, va_profile_, jpeg_entrypoint_list.data(), &num_entrypoints));
|
|
|
|
|
bool hw_jpeg_decoder_supported = false;
|
|
|
|
|
if (num_entrypoints > 0) {
|
|
|
|
|
for (auto entry_point : jpeg_entrypoint_list) {
|
|
|
|
|
if (entry_point == VAEntrypointVLD) {
|
|
|
|
|
hw_jpeg_decoder_supported = true;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
return ROCJPEG_STATUS_HW_JPEG_DECODER_NOT_SUPPORTED;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (hw_jpeg_decoder_supported) {
|
|
|
|
|
va_config_attrib_.resize(3);
|
|
|
|
|
va_config_attrib_[0].type = VAConfigAttribRTFormat;
|
|
|
|
|
va_config_attrib_[1].type = VAConfigAttribMaxPictureWidth;
|
|
|
|
|
va_config_attrib_[2].type = VAConfigAttribMaxPictureHeight;
|
|
|
|
|
CHECK_VAAPI(vaGetConfigAttributes(va_display_, va_profile_, VAEntrypointVLD, va_config_attrib_.data(), va_config_attrib_.size()));
|
|
|
|
|
CHECK_VAAPI(vaCreateConfig(va_display_, va_profile_, VAEntrypointVLD, &va_config_attrib_[0], 1, &va_config_id_));
|
|
|
|
|
if (va_config_attrib_[1].value != VA_ATTRIB_NOT_SUPPORTED) {
|
|
|
|
|
max_picture_width_ = va_config_attrib_[1].value;
|
|
|
|
|
}
|
|
|
|
|
if (va_config_attrib_[2].value != VA_ATTRIB_NOT_SUPPORTED) {
|
|
|
|
|
max_picture_height_ = va_config_attrib_[2].value;
|
|
|
|
|
}
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
} else {
|
|
|
|
|
return ROCJPEG_STATUS_HW_JPEG_DECODER_NOT_SUPPORTED;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::DestroyDataBuffers() {
|
|
|
|
|
if (va_picture_parameter_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_picture_parameter_buf_id_));
|
|
|
|
|
va_picture_parameter_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
if (va_quantization_matrix_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_quantization_matrix_buf_id_));
|
|
|
|
|
va_quantization_matrix_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
if (va_huffmantable_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_huffmantable_buf_id_));
|
|
|
|
|
va_huffmantable_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
if (va_slice_param_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_slice_param_buf_id_));
|
|
|
|
|
va_slice_param_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
if (va_slice_data_buf_id_) {
|
|
|
|
|
CHECK_VAAPI(vaDestroyBuffer(va_display_, va_slice_data_buf_id_));
|
|
|
|
|
va_slice_data_buf_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::SubmitDecode(const JpegStreamParameters *jpeg_stream_params, uint32_t &surface_id) {
|
|
|
|
|
if (jpeg_stream_params == nullptr) {
|
|
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (sizeof(jpeg_stream_params->picture_parameter_buffer) != sizeof(VAPictureParameterBufferJPEGBaseline) ||
|
|
|
|
|
sizeof(jpeg_stream_params->quantization_matrix_buffer) != sizeof(VAIQMatrixBufferJPEGBaseline) ||
|
|
|
|
|
sizeof(jpeg_stream_params->huffman_table_buffer) != sizeof(VAHuffmanTableBufferJPEGBaseline) ||
|
|
|
|
|
sizeof(jpeg_stream_params->slice_parameter_buffer) != sizeof(VASliceParameterBufferJPEGBaseline)) {
|
|
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (jpeg_stream_params->picture_parameter_buffer.picture_width < min_picture_width_ ||
|
|
|
|
|
jpeg_stream_params->picture_parameter_buffer.picture_height < min_picture_height_ ||
|
|
|
|
|
jpeg_stream_params->picture_parameter_buffer.picture_width > max_picture_width_ ||
|
|
|
|
|
jpeg_stream_params->picture_parameter_buffer.picture_height > max_picture_height_) {
|
|
|
|
|
ERR("The JPEG image resolution is not supported!");
|
|
|
|
|
return ROCJPEG_STATUS_JPEG_NOT_SUPPORTED;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
uint8_t surface_format;
|
|
|
|
|
switch (jpeg_stream_params->chroma_subsampling) {
|
|
|
|
|
case CSS_444:
|
|
|
|
|
surface_format = VA_RT_FORMAT_YUV444;
|
|
|
|
|
break;
|
|
|
|
|
case CSS_422:
|
|
|
|
|
surface_format = VA_RT_FORMAT_YUV422;
|
|
|
|
|
break;
|
|
|
|
|
case CSS_420:
|
|
|
|
|
surface_format = VA_RT_FORMAT_YUV420;
|
|
|
|
|
break;
|
|
|
|
|
case CSS_400:
|
|
|
|
|
surface_format = VA_RT_FORMAT_YUV400;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
ERR("ERROR: The chroma subsampling is not supported by the VCN hardware!");
|
|
|
|
|
return ROCJPEG_STATUS_JPEG_NOT_SUPPORTED;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
VASurfaceID va_surface_id;
|
|
|
|
|
CHECK_VAAPI(vaCreateSurfaces(va_display_, surface_format, jpeg_stream_params->picture_parameter_buffer.picture_width, jpeg_stream_params->picture_parameter_buffer.picture_height, &va_surface_id, 1, nullptr, 1));
|
|
|
|
|
va_surface_ids_.push_back(va_surface_id);
|
|
|
|
|
surface_id = va_surface_id;
|
|
|
|
|
|
|
|
|
|
if (va_context_id_) {
|
|
|
|
|
vaDestroyContext(va_display_, va_context_id_);
|
|
|
|
|
va_context_id_ = 0;
|
|
|
|
|
}
|
|
|
|
|
CHECK_VAAPI(vaCreateContext(va_display_, va_config_id_, jpeg_stream_params->picture_parameter_buffer.picture_width, jpeg_stream_params->picture_parameter_buffer.picture_height, VA_PROGRESSIVE, &va_surface_id, 1, &va_context_id_));
|
|
|
|
|
|
|
|
|
|
CHECK_ROCJPEG(DestroyDataBuffers());
|
|
|
|
|
|
|
|
|
|
CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAPictureParameterBufferType, sizeof(VAPictureParameterBufferJPEGBaseline), 1, (void *)&jpeg_stream_params->picture_parameter_buffer, &va_picture_parameter_buf_id_));
|
|
|
|
|
CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAIQMatrixBufferType, sizeof(VAIQMatrixBufferJPEGBaseline), 1, (void *)&jpeg_stream_params->quantization_matrix_buffer, &va_quantization_matrix_buf_id_));
|
|
|
|
|
CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VAHuffmanTableBufferType, sizeof(VAHuffmanTableBufferJPEGBaseline), 1, (void *)&jpeg_stream_params->huffman_table_buffer, &va_huffmantable_buf_id_));
|
|
|
|
|
CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VASliceParameterBufferType, sizeof(VASliceParameterBufferJPEGBaseline), 1, (void *)&jpeg_stream_params->slice_parameter_buffer, &va_slice_param_buf_id_));
|
|
|
|
|
CHECK_VAAPI(vaCreateBuffer(va_display_, va_context_id_, VASliceDataBufferType, jpeg_stream_params->slice_parameter_buffer.slice_data_size, 1, (void *)jpeg_stream_params->slice_data_buffer, &va_slice_data_buf_id_));
|
|
|
|
|
|
|
|
|
|
CHECK_VAAPI(vaBeginPicture(va_display_, va_context_id_, va_surface_id));
|
|
|
|
|
CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_picture_parameter_buf_id_, 1));
|
|
|
|
|
CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_quantization_matrix_buf_id_, 1));
|
|
|
|
|
CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_huffmantable_buf_id_, 1));
|
|
|
|
|
CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_slice_param_buf_id_, 1));
|
|
|
|
|
CHECK_VAAPI(vaRenderPicture(va_display_, va_context_id_, &va_slice_data_buf_id_, 1));
|
|
|
|
|
CHECK_VAAPI(vaEndPicture(va_display_, va_context_id_));
|
|
|
|
|
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::ExportSurface(VASurfaceID surface_id, VADRMPRIMESurfaceDescriptor &va_drm_prime_surface_desc) {
|
|
|
|
|
|
|
|
|
|
bool is_surface_id_found = false;
|
|
|
|
|
int idx = 0;
|
|
|
|
|
for (idx = 0; idx < va_surface_ids_.size(); idx++) {
|
|
|
|
|
if (va_surface_ids_[idx] == surface_id) {
|
|
|
|
|
is_surface_id_found = true;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (!is_surface_id_found) {
|
|
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
|
|
|
|
}
|
|
|
|
|
CHECK_VAAPI(vaExportSurfaceHandle(va_display_, surface_id,
|
|
|
|
|
VA_SURFACE_ATTRIB_MEM_TYPE_DRM_PRIME_2,
|
|
|
|
|
VA_EXPORT_SURFACE_READ_ONLY |
|
|
|
|
|
VA_EXPORT_SURFACE_SEPARATE_LAYERS,
|
|
|
|
|
&va_drm_prime_surface_desc));
|
|
|
|
|
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::SyncSurface(VASurfaceID surface_id) {
|
|
|
|
|
VASurfaceStatus surface_status;
|
|
|
|
|
bool is_surface_id_found = false;
|
|
|
|
|
int idx = 0;
|
|
|
|
|
|
|
|
|
|
for (idx = 0; idx < va_surface_ids_.size(); idx++) {
|
|
|
|
|
if (va_surface_ids_[idx] == surface_id) {
|
|
|
|
|
is_surface_id_found = true;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (!is_surface_id_found) {
|
|
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
CHECK_VAAPI(vaQuerySurfaceStatus(va_display_, surface_id, &surface_status));
|
|
|
|
|
while (surface_status != VASurfaceReady) {
|
|
|
|
|
VAStatus va_status = vaSyncSurface(va_display_, surface_id);
|
|
|
|
|
if (va_status != VA_STATUS_SUCCESS) {
|
|
|
|
|
if (va_status == 0x26 /*VA_STATUS_ERROR_TIMEDOUT*/) {
|
|
|
|
|
CHECK_VAAPI(vaQuerySurfaceStatus(va_display_, surface_id, &surface_status));
|
|
|
|
|
} else {
|
|
|
|
|
std::cout << "vaSyncSurface() failed with error code: 0x" << std::hex << va_status <<
|
|
|
|
|
std::dec << "', status: " << vaErrorStr(va_status) << "' at " << __FILE__ << ":" << __LINE__ << std::endl;
|
|
|
|
|
return ROCJPEG_STATUS_RUNTIME_ERROR;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
RocJpegStatus RocJpegVappiDecoder::ReleaseSurface(VASurfaceID surface_id) {
|
|
|
|
|
bool is_surface_id_found = false;
|
|
|
|
|
int idx = 0;
|
|
|
|
|
|
|
|
|
|
for (idx = 0; idx < va_surface_ids_.size(); idx++) {
|
|
|
|
|
if (va_surface_ids_[idx] == surface_id) {
|
|
|
|
|
is_surface_id_found = true;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (!is_surface_id_found) {
|
|
|
|
|
return ROCJPEG_STATUS_INVALID_PARAMETER;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
CHECK_VAAPI(vaDestroySurfaces(va_display_, &va_surface_ids_[idx], 1));
|
|
|
|
|
va_surface_ids_.erase(va_surface_ids_.begin() + idx);
|
|
|
|
|
|
|
|
|
|
return ROCJPEG_STATUS_SUCCESS;
|
2024-03-27 14:14:27 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void RocJpegVappiDecoder::GetVisibleDevices(std::vector<int>& visible_devices_vetor) {
|
|
|
|
|
char *visible_devices = std::getenv("HIP_VISIBLE_DEVICES");
|
|
|
|
|
if (visible_devices != nullptr) {
|
|
|
|
|
char *token = std::strtok(visible_devices,",");
|
|
|
|
|
while (token != nullptr) {
|
|
|
|
|
visible_devices_vetor.push_back(std::atoi(token));
|
|
|
|
|
token = std::strtok(nullptr,",");
|
|
|
|
|
}
|
|
|
|
|
std::sort(visible_devices_vetor.begin(), visible_devices_vetor.end());
|
|
|
|
|
}
|
2024-04-01 14:51:56 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void RocJpegVappiDecoder::GetCurrentComputePartition(std::vector<ComputePartition> ¤t_compute_partitions) {
|
|
|
|
|
std::string search_path = "/sys/devices/";
|
|
|
|
|
std::string partition_file = "current_compute_partition";
|
|
|
|
|
for (const auto& entry : std::filesystem::recursive_directory_iterator(search_path)) {
|
|
|
|
|
if (entry.path().filename() == partition_file) {
|
|
|
|
|
std::ifstream file(entry.path());
|
|
|
|
|
if (file.is_open()) {
|
|
|
|
|
std::string partition;
|
|
|
|
|
std::getline(file, partition);
|
|
|
|
|
if (partition.compare("SPX") == 0 || partition.compare("spx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kSpx);
|
|
|
|
|
} else if (partition.compare("DPX") == 0 || partition.compare("dpx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kDpx);
|
|
|
|
|
} else if (partition.compare("TPX") == 0 || partition.compare("tpx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kTpx);
|
|
|
|
|
} else if (partition.compare("QPX") == 0 || partition.compare("qpx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kQpx);
|
|
|
|
|
} else if (partition.compare("CPX") == 0 || partition.compare("cpx") == 0) {
|
|
|
|
|
current_compute_partitions.push_back(kCpx);
|
|
|
|
|
}
|
|
|
|
|
file.close();
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void RocJpegVappiDecoder::GetNumRenderCardsPerDevice(std::string device_name, uint8_t device_id, std::vector<int>& visible_devices,
|
|
|
|
|
std::vector<ComputePartition> ¤t_compute_partitions,
|
|
|
|
|
int &num_render_cards_per_socket, int &offset) {
|
|
|
|
|
offset = 0;
|
|
|
|
|
if (!current_compute_partitions.empty()) {
|
|
|
|
|
switch (current_compute_partitions[0]) {
|
|
|
|
|
case kSpx:
|
|
|
|
|
num_render_cards_per_socket = 8;
|
|
|
|
|
break;
|
|
|
|
|
case kDpx:
|
|
|
|
|
num_render_cards_per_socket = 4;
|
|
|
|
|
break;
|
|
|
|
|
case kTpx:
|
|
|
|
|
num_render_cards_per_socket = 2;
|
|
|
|
|
// Please note that although there are only 6 XCCs per socket on MI300A,
|
|
|
|
|
// there are two dummy render nodes added by the driver.
|
|
|
|
|
// This needs to be taken into account when creating drm_node on each socket in TPX mode.
|
|
|
|
|
if (device_id < visible_devices.size()) {
|
|
|
|
|
offset = (visible_devices[device_id] / 3) * 2;
|
|
|
|
|
} else {
|
|
|
|
|
offset = (device_id / 3) * 2;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case kQpx:
|
|
|
|
|
num_render_cards_per_socket = 2;
|
|
|
|
|
break;
|
|
|
|
|
case kCpx:
|
|
|
|
|
num_render_cards_per_socket = 1;
|
|
|
|
|
// Please note that both MI300A and MI300X have the same gfx_arch_name which is
|
|
|
|
|
// gfx942. Therefore we cannot use the gfx942 to identify MI300A.
|
|
|
|
|
// instead use the device name and look for MI300A
|
|
|
|
|
// Also, as explained aboe in the TPX mode section, we need to be taken into account
|
|
|
|
|
// the extra two dummy nodes when creating drm_node on each socket in CPX mode as well.
|
|
|
|
|
std::string mi300a = "MI300A";
|
|
|
|
|
size_t found_mi300a = device_name.find(mi300a);
|
|
|
|
|
if (found_mi300a != std::string::npos) {
|
|
|
|
|
offset = (device_id / 6) * 2;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
2024-03-25 17:05:31 -04:00
|
|
|
}
|