文件
rocm-systems/projects/rocr-runtime/runtime/hsa-runtime/image/image_runtime.h
T
Apurv Mishra be375c2dbf rocr: Add support for Mipmapped Array (#1847)
SWDEV-539526 - Add support for Mipmapped Array in Rocr

Add support for Mipmapped Array functionality in Rocr Runtimeenabling GPU applications to work with multi-level texture mipmaps. The implementation introduces new public APIs for creating, querying, and managing mipmapped arrays across different GPU architectures.

Signed-off-by: Apurv Mishra <Apurv.Mishra@amd.com>
Co-authored-by: Shweta Khatri <shweta.khatri@amd.com>
Co-authored-by: taosang2 <tao.sang@amd.com>
2026-01-08 17:14:39 -06:00

233 行
9.4 KiB
C++

////////////////////////////////////////////////////////////////////////////////
//
// The University of Illinois/NCSA
// Open Source License (NCSA)
//
// Copyright (c) 2014-2020, Advanced Micro Devices, Inc. All rights reserved.
//
// Developed by:
//
// AMD Research and AMD HSA Software Development
//
// Advanced Micro Devices, Inc.
//
// www.amd.com
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to
// deal with the Software without restriction, including without limitation
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
// and/or sell copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following conditions:
//
// - Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimers.
// - Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimers in
// the documentation and/or other materials provided with the distribution.
// - Neither the names of Advanced Micro Devices, Inc,
// nor the names of its contributors may be used to endorse or promote
// products derived from this Software without specific prior written
// permission.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
// DEALINGS WITH THE SOFTWARE.
//
////////////////////////////////////////////////////////////////////////////////
#ifndef HSA_RUNTIME_EXT_IMAGE_IMAGE_RUNTIME_H
#define HSA_RUNTIME_EXT_IMAGE_IMAGE_RUNTIME_H
#include <atomic>
#include <map>
#include <mutex>
#include "inc/hsa.h"
#include "inc/hsa_ext_image.h"
#include "inc/hsa_ext_amd.h"
#include "blit_kernel.h"
#include "image_manager.h"
#include "util.h"
namespace rocr {
namespace image {
class ImageRuntime {
public:
/// @brief Getter for the ImageRuntime singleton object.
static ImageRuntime* instance();
/// @brief Destroy singleton object.
static void DestroySingleton();
/// @brief Retrieve maximum size of width, height, depth, array size in pixels
/// for a particular geometry on a component.
hsa_status_t GetImageInfoMaxDimension(hsa_agent_t component,
hsa_agent_info_t attribute,
void* value);
/// @brief Query image support with particular format and geometry.
hsa_status_t GetImageCapability(hsa_agent_t component,
const hsa_ext_image_format_t& format,
hsa_ext_image_geometry_t geometry,
uint32_t& capability);
/// @brief Query the size and address alignment of the backing storage of
/// the image.
hsa_status_t GetImageSizeAndAlignment(hsa_agent_t component,
const hsa_ext_image_descriptor_t& desc,
hsa_ext_image_data_layout_t image_data_layout,
size_t image_data_row_pitch,
size_t image_data_slice_pitch,
hsa_ext_image_data_info_t& image_info);
/// @brief Create device image object and return its handle.
hsa_status_t CreateImageHandle(
hsa_agent_t component, const hsa_ext_image_descriptor_t& image_descriptor,
const void* image_data, const hsa_access_permission_t access_permission,
hsa_ext_image_data_layout_t image_data_layout,
size_t image_data_row_pitch,
size_t image_data_slice_pitch,
hsa_ext_image_t& image);
/// @brief Create device image object and return its handle.
hsa_status_t CreateImageHandleWithLayout(
hsa_agent_t component, const hsa_ext_image_descriptor_t& image_descriptor,
const hsa_amd_image_descriptor_t* image_layout,
const void* image_data, const hsa_access_permission_t access_permission,
hsa_ext_image_t& image);
/// @brief Create mipmapped array object with AMD-specific layout and return its handle.
hsa_status_t CreateMipmapArrayHandleWithLayout(
hsa_agent_t component, const hsa_ext_image_descriptor_t& mipmap_descriptor,
const hsa_amd_image_descriptor_t* image_layout,
const void* image_data, const hsa_access_permission_t access_permission,
uint32_t num_mipmap_levels,
hsa_ext_image_t& image_handle);
/// @brief Destroy the device image object referenced by the handle.
hsa_status_t DestroyImageHandle(const hsa_ext_image_t& image);
/// @brief Copy the content of a linear memory to an image object.
hsa_status_t CopyBufferToImage(const void* src_memory, size_t src_row_pitch,
size_t src_slice_pitch,
const hsa_ext_image_t& dst_image,
const hsa_ext_image_region_t& image_region);
/// @brief Copy the content of an image object to a linear memory.
hsa_status_t CopyImageToBuffer(const hsa_ext_image_t& src_image,
void* dst_memory, size_t dst_row_pitch,
size_t dst_slice_pitch,
const hsa_ext_image_region_t& image_region);
/// @brief Copy the content of an image object to another image object.
hsa_status_t CopyImage(const hsa_ext_image_t& src_image,
const hsa_ext_image_t& dst_image,
const hsa_dim3_t& src_origin,
const hsa_dim3_t& dst_origin, const hsa_dim3_t size);
/// @brief Fill the content of an image object with a pattern.
hsa_status_t FillImage(const hsa_ext_image_t& image, const void* pattern,
const hsa_ext_image_region_t& image_region);
/// @brief Create device sampler object and return its handle.
hsa_status_t CreateSamplerHandle(
hsa_agent_t component,
const hsa_ext_sampler_descriptor_v2_t& sampler_descriptor,
hsa_ext_sampler_t& sampler);
/// @brief Destroy the device sampler object referenced by the handle.
hsa_status_t DestroySamplerHandle(hsa_ext_sampler_t& sampler);
/// @brief Create device Mipmap array object and return its handle
hsa_status_t CreateMipmapArrayHandle(
hsa_agent_t component, const hsa_ext_image_descriptor_t& mipmap_descriptor,
const void* image_data, const hsa_access_permission_t access_permission,
uint32_t num_mipmap_levels,
const hsa_ext_image_data_layout_t mipmap_layout,
size_t image_data_row_pitch, size_t image_data_slice_pitch,
hsa_ext_image_t& image_handle);
/// @brief - Helper function to compute mipmapped surface size / alignment & max levels.
hsa_status_t GetMipmapArraySizeAndAlignment(
hsa_agent_t component,
const hsa_ext_image_descriptor_t& desc,
uint32_t num_mipmap_levels,
hsa_ext_image_data_layout_t layout,
size_t row_pitch,
size_t slice_pitch,
size_t& size_out,
size_t& alignment_out);
/// @brief Destroy the mipmapped array object referenced by the handle.
hsa_status_t DestroyMipmapArrayHandle(const hsa_ext_image_t& image_handle);
/// @brief Get the handle for a specific mipmap level in a mipmapped array.
hsa_status_t GetMipmapArrayLevelHandle(
hsa_agent_t agent, const hsa_ext_image_t& mipmapped_array,
uint32_t mip_level, hsa_ext_image_t& level_image_out);
ImageManager* image_manager(hsa_agent_t agent) {
std::map<uint64_t, ImageManager*>::iterator it = image_managers_.find(agent.handle);
return (it != image_managers_.end()) ? it->second : NULL;
}
BlitKernel& blit_kernel() { return blit_kernel_; }
size_t cpu_l2_cache_size() const { return cpu_l2_cache_size_; }
hsa_amd_memory_pool_t kernarg_pool() const {
return kernarg_pool_;
}
private:
/// @brief Initialize singleton object, must be called once.
static ImageRuntime* CreateSingleton();
static hsa_status_t CreateImageManager(hsa_agent_t agent, void* data);
ImageRuntime();
~ImageRuntime();
void Cleanup();
/// Pointer to singleton object.
static __forceinline std::atomic<ImageRuntime*>& get_instance() {
// This allocation is meant to last until the last thread has exited.
// It is intentionally not freed.
static std::atomic<ImageRuntime*>* instance_ = new std::atomic<ImageRuntime*>();
return *instance_;
}
static __forceinline std::mutex& instance_mutex() {
// This allocation is meant to last until the last thread has exited.
// It is intentionally not freed.
static std::mutex* instance_mutex_ = new std::mutex();
return *instance_mutex_;
}
/// @brief Contains mapping of agent and its corresponding ::ImageManager
/// object.
std::map<uint64_t, ImageManager*> image_managers_;
/// @brief Manages kernel for accessing images.
BlitKernel blit_kernel_;
size_t cpu_l2_cache_size_;
hsa_amd_memory_pool_t kernarg_pool_;
DISALLOW_COPY_AND_ASSIGN(ImageRuntime);
};
} // namespace image
} // namespace rocr
#endif // HSA_RUNTIME_EXT_IMAGE_IMAGE_RUNTIME_H