Files
Apurv Mishra be375c2dbf rocr: Add support for Mipmapped Array (#1847)
SWDEV-539526 - Add support for Mipmapped Array in Rocr

Add support for Mipmapped Array functionality in the Rocr Runtime, enabling GPU applications to work with multi-level texture mipmaps. The implementation introduces new public APIs for creating, querying, and managing mipmapped arrays across different GPU architectures.

Signed-off-by: Apurv Mishra <Apurv.Mishra@amd.com>
Co-authored-by: Shweta Khatri <shweta.khatri@amd.com>
Co-authored-by: taosang2 <tao.sang@amd.com>
2026-01-08 17:14:39 -06:00

192 rader
7.8 KiB
C++

////////////////////////////////////////////////////////////////////////////////
//
// The University of Illinois/NCSA
// Open Source License (NCSA)
//
// Copyright (c) 2014-2020, Advanced Micro Devices, Inc. All rights reserved.
//
// Developed by:
//
// AMD Research and AMD HSA Software Development
//
// Advanced Micro Devices, Inc.
//
// www.amd.com
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to
// deal with the Software without restriction, including without limitation
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
// and/or sell copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following conditions:
//
// - Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimers.
// - Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimers in
// the documentation and/or other materials provided with the distribution.
// - Neither the names of Advanced Micro Devices, Inc,
// nor the names of its contributors may be used to endorse or promote
// products derived from this Software without specific prior written
// permission.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
// DEALINGS WITH THE SOFTWARE.
//
////////////////////////////////////////////////////////////////////////////////
#ifndef AMD_HSA_EXT_IMAGE_IMAGE_MANAGER_H
#define AMD_HSA_EXT_IMAGE_IMAGE_MANAGER_H
#include <cstring>
#include "inc/hsa.h"
#include "inc/hsa_ext_image.h"
#include "resource.h"
#include "util.h"
#include "image/addrlib/inc/addrinterface.h"
namespace rocr {
namespace image {
/// @brief Abstract interface through which AMD agent specific image, sampler
/// and mipmapped array resources are created and image data is transferred.
///
/// Most members are pure virtual and must be supplied by a derived class.
/// The copy/fill entry points are virtual but not pure, so a definition for
/// them is expected outside this header.
class ImageManager {
 public:
  explicit ImageManager();
  virtual ~ImageManager();

  /// @brief Set up the manager for the agent identified by @p agent_handle.
  virtual hsa_status_t Initialize(hsa_agent_t agent_handle) = 0;

  /// @brief Counterpart of Initialize().
  virtual void Cleanup() = 0;

  /// @brief Query the device specific image property for a given format and
  /// geometry.
  virtual ImageProperty GetImageProperty(
      hsa_agent_t component,
      const hsa_ext_image_format_t& format,
      hsa_ext_image_geometry_t geometry) const = 0;

  /// @brief Query the device specific maximum width, height, depth and array
  /// size supported for an image geometry. Results are written through the
  /// reference parameters.
  virtual void GetImageInfoMaxDimension(
      hsa_agent_t component,
      hsa_ext_image_geometry_t geometry,
      uint32_t& width,
      uint32_t& height,
      uint32_t& depth,
      uint32_t& array_size) const = 0;

  /// @brief Compute the size and alignment of the backing storage of an
  /// image; the result is written to @p image_info.
  virtual hsa_status_t CalculateImageSizeAndAlignment(
      hsa_agent_t component,
      const hsa_ext_image_descriptor_t& desc,
      hsa_ext_image_data_layout_t image_data_layout,
      uint32_t num_mipmap_levels,
      size_t image_data_row_pitch,
      size_t image_data_slice_pitch,
      hsa_ext_image_data_info_t& image_info) const = 0;

  /// @brief Populate the image structure with the device specific image
  /// object.
  virtual hsa_status_t PopulateImageSrd(Image& image) const = 0;

  /// @brief Populate the image structure with the device specific image
  /// object, using the supplied metadata descriptor.
  virtual hsa_status_t PopulateImageSrd(
      Image& image, const metadata_amd_t* desc) const = 0;

  /// @brief Update the device specific image object to match the specified
  /// new format.
  virtual hsa_status_t ModifyImageSrd(
      Image& image, hsa_ext_image_format_t& new_format) const = 0;

  /// @brief Populate the sampler structure with the device specific sampler
  /// object.
  virtual hsa_status_t PopulateSamplerSrd(Sampler& sampler) const = 0;

  /// @brief Copy the content of a linear memory to an image object.
  virtual hsa_status_t CopyBufferToImage(
      const void* src_memory,
      size_t src_row_pitch,
      size_t src_slice_pitch,
      const Image& dst_image,
      const hsa_ext_image_region_t& image_region);

  /// @brief Copy the content of an image object to a linear memory.
  virtual hsa_status_t CopyImageToBuffer(
      const Image& src_image,
      void* dst_memory,
      size_t dst_row_pitch,
      size_t dst_slice_pitch,
      const hsa_ext_image_region_t& image_region);

  /// @brief Transfer backing storage from @p src_image to @p dst_image.
  virtual hsa_status_t CopyImage(
      const Image& dst_image,
      const Image& src_image,
      const hsa_dim3_t& dst_origin,
      const hsa_dim3_t& src_origin,
      const hsa_dim3_t size);

  /// @brief Fill image backing storage using host copy.
  virtual hsa_status_t FillImage(
      const Image& image,
      const void* pattern,
      const hsa_ext_image_region_t& region);

  /// @brief Return the address library handle.
  virtual ADDR_HANDLE GetAddrLib() const = 0;

  /// @brief Populate the mipmap structure with the device specific
  /// mipmapped array object.
  virtual hsa_status_t PopulateMipmapSrd(
      MipmappedArray& mipmap_array) const = 0;

  /// @brief Populate the mipmap structure from a pre-computed AMD metadata
  /// descriptor.
  virtual hsa_status_t PopulateMipmapSrd(
      MipmappedArray& mipmap_array, const metadata_amd_t* desc) const = 0;

  /// @brief Create a view of a single mip level using the SRD
  /// BASE_LEVEL/LAST_LEVEL fields.
  virtual hsa_status_t PopulateMipLevelSrd(
      MipmappedArray& level_view,
      const MipmappedArray& mipmap_array,
      uint32_t mip_level) const = 0;

  // NOTE(review): the four print* hooks below look like SRD debug-dump
  // helpers; their output format is not visible from this header -- confirm
  // against the per-device implementations.
  virtual void printSRDDetailed(const uint32_t* srd) const = 0;
  virtual void printChannelSelect(uint32_t sel) const = 0;
  virtual void printResourceType(uint32_t type) const = 0;
  virtual void printSwizzleMode(uint32_t sw_mode) const = 0;

 protected:
  // Shared helpers, declared here and defined elsewhere.
  // NOTE(review): judging by their names these are pixel/pattern conversion
  // utilities -- confirm against the definitions.
  static uint16_t FloatToHalf(float in);
  static inline float Normalize(uint8_t u_val);
  static inline uint8_t Denormalize(float f_val);
  static float StandardToLinearRGB(float s_val);
  static float LinearToStandardRGB(float l_val);
  static void FormatPattern(const hsa_ext_image_format_t& format,
                            const void* pattern_in, void* pattern_out);

  /// @brief Translate three HSA sampler addressing modes into the clamp
  /// fields of a sampler word.
  ///
  /// @tparam dstT Type of the destination word; must expose
  ///         `bits.CLAMP_X`, `bits.CLAMP_Y` and `bits.CLAMP_Z`.
  /// @tparam srcT Enumeration providing `SQ_TEX_CLAMP_LAST_TEXEL`,
  ///         `SQ_TEX_CLAMP_BORDER`, `SQ_TEX_MIRROR` and `SQ_TEX_WRAP`.
  /// @param word Destination word whose CLAMP_X/Y/Z fields are written.
  /// @param address_mode Addressing modes; element 0 feeds CLAMP_X,
  ///        element 1 CLAMP_Y and element 2 CLAMP_Z.
  /// @return HSA_STATUS_SUCCESS once all three fields are written, or
  ///         HSA_STATUS_ERROR_INVALID_ARGUMENT if any element is not a
  ///         recognised addressing mode (in which case @p word is untouched).
  template <typename dstT, typename srcT>
  static inline hsa_status_t convertAddressMode(
      dstT& word,
      const hsa_ext_sampler_addressing_mode32_t address_mode[3]) {
    // Translate every axis up front; nothing is stored into `word` until all
    // three modes are known to be valid.
    unsigned int clamp_bits[3];

    for (int axis = 0; axis < 3; ++axis) {
      srcT hw_mode;

      switch (address_mode[axis]) {
        // UNDEFINED shares the REPEAT mapping.
        case HSA_EXT_SAMPLER_ADDRESSING_MODE_UNDEFINED:
        case HSA_EXT_SAMPLER_ADDRESSING_MODE_REPEAT:
          hw_mode = srcT::SQ_TEX_WRAP;
          break;

        case HSA_EXT_SAMPLER_ADDRESSING_MODE_CLAMP_TO_EDGE:
          hw_mode = srcT::SQ_TEX_CLAMP_LAST_TEXEL;
          break;

        case HSA_EXT_SAMPLER_ADDRESSING_MODE_CLAMP_TO_BORDER:
          hw_mode = srcT::SQ_TEX_CLAMP_BORDER;
          break;

        case HSA_EXT_SAMPLER_ADDRESSING_MODE_MIRRORED_REPEAT:
          hw_mode = srcT::SQ_TEX_MIRROR;
          break;

        default:
          return HSA_STATUS_ERROR_INVALID_ARGUMENT;
      }

      clamp_bits[axis] = static_cast<unsigned int>(hw_mode);
    }

    word.bits.CLAMP_X = clamp_bits[0];
    word.bits.CLAMP_Y = clamp_bits[1];
    word.bits.CLAMP_Z = clamp_bits[2];
    return HSA_STATUS_SUCCESS;
  }

 private:
  DISALLOW_COPY_AND_ASSIGN(ImageManager);
};
} // namespace image
} // namespace rocr
#endif // AMD_HSA_EXT_IMAGE_IMAGE_MANAGER_H