be375c2dbf
SWDEV-539526 - Add support for Mipmapped Array in Rocr Add support for Mipmapped Array functionality in Rocr Runtimeenabling GPU applications to work with multi-level texture mipmaps. The implementation introduces new public APIs for creating, querying, and managing mipmapped arrays across different GPU architectures. Signed-off-by: Apurv Mishra <Apurv.Mishra@amd.com> Co-authored-by: Shweta Khatri <shweta.khatri@amd.com> Co-authored-by: taosang2 <tao.sang@amd.com>
233 行
9.4 KiB
C++
233 行
9.4 KiB
C++
////////////////////////////////////////////////////////////////////////////////
|
|
//
|
|
// The University of Illinois/NCSA
|
|
// Open Source License (NCSA)
|
|
//
|
|
// Copyright (c) 2014-2020, Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Developed by:
|
|
//
|
|
// AMD Research and AMD HSA Software Development
|
|
//
|
|
// Advanced Micro Devices, Inc.
|
|
//
|
|
// www.amd.com
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to
|
|
// deal with the Software without restriction, including without limitation
|
|
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
// and/or sell copies of the Software, and to permit persons to whom the
|
|
// Software is furnished to do so, subject to the following conditions:
|
|
//
|
|
// - Redistributions of source code must retain the above copyright notice,
|
|
// this list of conditions and the following disclaimers.
|
|
// - Redistributions in binary form must reproduce the above copyright
|
|
// notice, this list of conditions and the following disclaimers in
|
|
// the documentation and/or other materials provided with the distribution.
|
|
// - Neither the names of Advanced Micro Devices, Inc,
|
|
// nor the names of its contributors may be used to endorse or promote
|
|
// products derived from this Software without specific prior written
|
|
// permission.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
// DEALINGS WITH THE SOFTWARE.
|
|
//
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#ifndef HSA_RUNTIME_EXT_IMAGE_IMAGE_RUNTIME_H
|
|
#define HSA_RUNTIME_EXT_IMAGE_IMAGE_RUNTIME_H
|
|
|
|
#include <atomic>
|
|
#include <map>
|
|
#include <mutex>
|
|
|
|
#include "inc/hsa.h"
|
|
|
|
#include "inc/hsa_ext_image.h"
|
|
#include "inc/hsa_ext_amd.h"
|
|
#include "blit_kernel.h"
|
|
#include "image_manager.h"
|
|
#include "util.h"
|
|
|
|
namespace rocr {
|
|
namespace image {
|
|
|
|
class ImageRuntime {
|
|
public:
|
|
/// @brief Getter for the ImageRuntime singleton object.
|
|
static ImageRuntime* instance();
|
|
|
|
/// @brief Destroy singleton object.
|
|
static void DestroySingleton();
|
|
|
|
/// @brief Retrieve maximum size of width, height, depth, array size in pixels
|
|
/// for a particular geometry on a component.
|
|
hsa_status_t GetImageInfoMaxDimension(hsa_agent_t component,
|
|
hsa_agent_info_t attribute,
|
|
void* value);
|
|
|
|
/// @brief Query image support with particular format and geometry.
|
|
hsa_status_t GetImageCapability(hsa_agent_t component,
|
|
const hsa_ext_image_format_t& format,
|
|
hsa_ext_image_geometry_t geometry,
|
|
uint32_t& capability);
|
|
|
|
/// @brief Query the size and address alignment of the backing storage of
|
|
/// the image.
|
|
hsa_status_t GetImageSizeAndAlignment(hsa_agent_t component,
|
|
const hsa_ext_image_descriptor_t& desc,
|
|
hsa_ext_image_data_layout_t image_data_layout,
|
|
size_t image_data_row_pitch,
|
|
size_t image_data_slice_pitch,
|
|
hsa_ext_image_data_info_t& image_info);
|
|
|
|
/// @brief Create device image object and return its handle.
|
|
hsa_status_t CreateImageHandle(
|
|
hsa_agent_t component, const hsa_ext_image_descriptor_t& image_descriptor,
|
|
const void* image_data, const hsa_access_permission_t access_permission,
|
|
hsa_ext_image_data_layout_t image_data_layout,
|
|
size_t image_data_row_pitch,
|
|
size_t image_data_slice_pitch,
|
|
hsa_ext_image_t& image);
|
|
|
|
/// @brief Create device image object and return its handle.
|
|
hsa_status_t CreateImageHandleWithLayout(
|
|
hsa_agent_t component, const hsa_ext_image_descriptor_t& image_descriptor,
|
|
const hsa_amd_image_descriptor_t* image_layout,
|
|
const void* image_data, const hsa_access_permission_t access_permission,
|
|
hsa_ext_image_t& image);
|
|
|
|
/// @brief Create mipmapped array object with AMD-specific layout and return its handle.
|
|
hsa_status_t CreateMipmapArrayHandleWithLayout(
|
|
hsa_agent_t component, const hsa_ext_image_descriptor_t& mipmap_descriptor,
|
|
const hsa_amd_image_descriptor_t* image_layout,
|
|
const void* image_data, const hsa_access_permission_t access_permission,
|
|
uint32_t num_mipmap_levels,
|
|
hsa_ext_image_t& image_handle);
|
|
|
|
/// @brief Destroy the device image object referenced by the handle.
|
|
hsa_status_t DestroyImageHandle(const hsa_ext_image_t& image);
|
|
|
|
/// @brief Copy the content of a linear memory to an image object.
|
|
hsa_status_t CopyBufferToImage(const void* src_memory, size_t src_row_pitch,
|
|
size_t src_slice_pitch,
|
|
const hsa_ext_image_t& dst_image,
|
|
const hsa_ext_image_region_t& image_region);
|
|
|
|
/// @brief Copy the content of an image object to a linear memory.
|
|
hsa_status_t CopyImageToBuffer(const hsa_ext_image_t& src_image,
|
|
void* dst_memory, size_t dst_row_pitch,
|
|
size_t dst_slice_pitch,
|
|
const hsa_ext_image_region_t& image_region);
|
|
|
|
/// @brief Copy the content of an image object to another image object.
|
|
hsa_status_t CopyImage(const hsa_ext_image_t& src_image,
|
|
const hsa_ext_image_t& dst_image,
|
|
const hsa_dim3_t& src_origin,
|
|
const hsa_dim3_t& dst_origin, const hsa_dim3_t size);
|
|
|
|
/// @brief Fill the content of an image object with a pattern.
|
|
hsa_status_t FillImage(const hsa_ext_image_t& image, const void* pattern,
|
|
const hsa_ext_image_region_t& image_region);
|
|
|
|
/// @brief Create device sampler object and return its handle.
|
|
hsa_status_t CreateSamplerHandle(
|
|
hsa_agent_t component,
|
|
const hsa_ext_sampler_descriptor_v2_t& sampler_descriptor,
|
|
hsa_ext_sampler_t& sampler);
|
|
|
|
/// @brief Destroy the device sampler object referenced by the handle.
|
|
hsa_status_t DestroySamplerHandle(hsa_ext_sampler_t& sampler);
|
|
|
|
/// @brief Create device Mipmap array object and return its handle
|
|
hsa_status_t CreateMipmapArrayHandle(
|
|
hsa_agent_t component, const hsa_ext_image_descriptor_t& mipmap_descriptor,
|
|
const void* image_data, const hsa_access_permission_t access_permission,
|
|
uint32_t num_mipmap_levels,
|
|
const hsa_ext_image_data_layout_t mipmap_layout,
|
|
size_t image_data_row_pitch, size_t image_data_slice_pitch,
|
|
hsa_ext_image_t& image_handle);
|
|
|
|
/// @brief - Helper function to compute mipmapped surface size / alignment & max levels.
|
|
hsa_status_t GetMipmapArraySizeAndAlignment(
|
|
hsa_agent_t component,
|
|
const hsa_ext_image_descriptor_t& desc,
|
|
uint32_t num_mipmap_levels,
|
|
hsa_ext_image_data_layout_t layout,
|
|
size_t row_pitch,
|
|
size_t slice_pitch,
|
|
size_t& size_out,
|
|
size_t& alignment_out);
|
|
|
|
/// @brief Destroy the mipmapped array object referenced by the handle.
|
|
hsa_status_t DestroyMipmapArrayHandle(const hsa_ext_image_t& image_handle);
|
|
|
|
/// @brief Get the handle for a specific mipmap level in a mipmapped array.
|
|
hsa_status_t GetMipmapArrayLevelHandle(
|
|
hsa_agent_t agent, const hsa_ext_image_t& mipmapped_array,
|
|
uint32_t mip_level, hsa_ext_image_t& level_image_out);
|
|
|
|
ImageManager* image_manager(hsa_agent_t agent) {
|
|
std::map<uint64_t, ImageManager*>::iterator it = image_managers_.find(agent.handle);
|
|
return (it != image_managers_.end()) ? it->second : NULL;
|
|
}
|
|
|
|
BlitKernel& blit_kernel() { return blit_kernel_; }
|
|
|
|
size_t cpu_l2_cache_size() const { return cpu_l2_cache_size_; }
|
|
|
|
hsa_amd_memory_pool_t kernarg_pool() const {
|
|
return kernarg_pool_;
|
|
}
|
|
|
|
private:
|
|
/// @brief Initialize singleton object, must be called once.
|
|
static ImageRuntime* CreateSingleton();
|
|
|
|
static hsa_status_t CreateImageManager(hsa_agent_t agent, void* data);
|
|
|
|
ImageRuntime();
|
|
|
|
~ImageRuntime();
|
|
|
|
void Cleanup();
|
|
|
|
/// Pointer to singleton object.
|
|
static __forceinline std::atomic<ImageRuntime*>& get_instance() {
|
|
// This allocation is meant to last until the last thread has exited.
|
|
// It is intentionally not freed.
|
|
static std::atomic<ImageRuntime*>* instance_ = new std::atomic<ImageRuntime*>();
|
|
return *instance_;
|
|
}
|
|
|
|
static __forceinline std::mutex& instance_mutex() {
|
|
// This allocation is meant to last until the last thread has exited.
|
|
// It is intentionally not freed.
|
|
static std::mutex* instance_mutex_ = new std::mutex();
|
|
return *instance_mutex_;
|
|
}
|
|
|
|
/// @brief Contains mapping of agent and its corresponding ::ImageManager
|
|
/// object.
|
|
std::map<uint64_t, ImageManager*> image_managers_;
|
|
|
|
/// @brief Manages kernel for accessing images.
|
|
BlitKernel blit_kernel_;
|
|
|
|
size_t cpu_l2_cache_size_;
|
|
|
|
hsa_amd_memory_pool_t kernarg_pool_;
|
|
|
|
DISALLOW_COPY_AND_ASSIGN(ImageRuntime);
|
|
};
|
|
|
|
} // namespace image
|
|
} // namespace rocr
|
|
#endif // HSA_RUNTIME_EXT_IMAGE_IMAGE_RUNTIME_H
|