1a422d9798
In samples/2_Cookbook/11_texture_driver, add Vector data types(char4, short4, int4, float4); More arithmetic data types(char, short, int); Change-Id: I54aa482213d340d32cf912601adead0812c2323a
249 baris
8.9 KiB
C++
249 baris
8.9 KiB
C++
/*
|
|
Copyright (c) 2015 - 2021 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
|
|
#include "hip/hip_runtime.h"
|
|
#include <iostream>
|
|
#include <fstream>
|
|
#include <vector>
|
|
|
|
#define fileName "tex2dKernel.code"
|
|
|
|
bool testResult = true;
|
|
|
|
#define HIP_CHECK(cmd) \
|
|
{ \
|
|
hipError_t status = cmd; \
|
|
if (status != hipSuccess) { \
|
|
std::cout << "error: #" << status << " (" << hipGetErrorString(status) \
|
|
<< ") at line:" << __LINE__ << ": " << #cmd << std::endl; \
|
|
abort(); \
|
|
} \
|
|
}
|
|
|
|
template<typename T,
|
|
typename std::enable_if<std::is_arithmetic<T>::value>::type *t = nullptr>
|
|
static inline hipArray_Format getArrayFormat() {
|
|
if (std::is_same<char, T>::value) {
|
|
return HIP_AD_FORMAT_SIGNED_INT8;
|
|
} else if (std::is_same<short, T>::value) {
|
|
return HIP_AD_FORMAT_SIGNED_INT16;
|
|
} else if (std::is_same<int, T>::value) {
|
|
return HIP_AD_FORMAT_SIGNED_INT32;
|
|
} else if (std::is_same<float, T>::value) {
|
|
return HIP_AD_FORMAT_FLOAT;
|
|
}
|
|
return HIP_AD_FORMAT_HALF;
|
|
}
|
|
|
|
template<typename T,
|
|
typename std::enable_if<!std::is_arithmetic<T>::value>::type *t = nullptr>
|
|
static inline hipArray_Format getArrayFormat() {
|
|
return getArrayFormat<decltype(T::x)>();
|
|
}
|
|
|
|
template<typename T>
|
|
static inline constexpr int rank() {
|
|
return sizeof(T) / sizeof(decltype(T::x));
|
|
}
|
|
|
|
template<typename T>
|
|
static inline T getRandom() {
|
|
double r = 0;
|
|
if (std::is_signed < T > ::value) {
|
|
r = (std::rand() - RAND_MAX / 2.0) / (RAND_MAX / 2.0 + 1.);
|
|
} else {
|
|
r = std::rand() / (RAND_MAX + 1.);
|
|
}
|
|
return static_cast<T>(std::numeric_limits < T > ::max() * r);
|
|
}
|
|
|
|
template<typename T,
|
|
typename std::enable_if<std::is_arithmetic<T>::value>::type* = nullptr>
|
|
static inline constexpr int getChannels() {
|
|
return 1;
|
|
}
|
|
|
|
template<typename T,
|
|
typename std::enable_if<!std::is_arithmetic<T>::value>::type *t = nullptr,
|
|
typename std::enable_if<rank<T>() != 0>::type *r = nullptr>
|
|
static inline constexpr int getChannels() {
|
|
return rank<T>();
|
|
}
|
|
|
|
template<typename T,
|
|
typename std::enable_if<std::is_arithmetic<T>::value>::type* = nullptr>
|
|
static inline void printDiff(const int &i, const int &j, const T &expected,
|
|
const T &output) {
|
|
std::cout << "Difference [" << i << " " << j << "]: " << expected << " - "
|
|
<< output << "\n";
|
|
}
|
|
|
|
template<typename T,
|
|
typename std::enable_if<!std::is_arithmetic<T>::value>::type* = nullptr,
|
|
typename std::enable_if<rank<T>() == 4>::type* = nullptr>
|
|
static inline void printDiff(const int &i, const int &j, const T &expected,
|
|
const T &output) {
|
|
std::cout << "Difference [" << i << " " << j << "]: " << expected.x << ","
|
|
<< expected.y << "," << expected.z << "," << expected.w << " - "
|
|
<< output.x << "," << output.y << "," << output.z << "," << output.w
|
|
<< "\n";
|
|
}
|
|
|
|
template<typename T,
|
|
typename std::enable_if<std::is_arithmetic<T>::value>::type* = nullptr>
|
|
static inline void initVal(T &val) {
|
|
val = getRandom<T>();
|
|
}
|
|
|
|
template<typename T,
|
|
typename std::enable_if<!std::is_arithmetic<T>::value>::type* = nullptr,
|
|
typename std::enable_if<rank<T>() == 4>::type* = nullptr>
|
|
static inline void initVal(T &val) {
|
|
val.x = getRandom<decltype(T::x)>();
|
|
val.y = getRandom<decltype(T::x)>();
|
|
val.z = getRandom<decltype(T::x)>();
|
|
val.w = getRandom<decltype(T::x)>();
|
|
}
|
|
|
|
template<typename T>
|
|
bool runTest(hipModule_t &module, const char *refName, const char *funcName) {
|
|
hipArray_Format format = getArrayFormat<T>();
|
|
int channels = getChannels<T>();
|
|
unsigned int width = 256;
|
|
unsigned int height = 256;
|
|
unsigned int size = width * height * sizeof(T);
|
|
T *hData = (T*) malloc(size);
|
|
memset(hData, 0, size);
|
|
for (int i = 0; i < height; i++) {
|
|
for (int j = 0; j < width; j++) {
|
|
initVal(hData[i * width + j]);
|
|
}
|
|
}
|
|
|
|
hipArray *array;
|
|
HIP_ARRAY_DESCRIPTOR desc;
|
|
desc.Format = format;
|
|
desc.NumChannels = channels;
|
|
desc.Width = width;
|
|
desc.Height = height;
|
|
HIP_CHECK(hipArrayCreate(&array, &desc));
|
|
|
|
hip_Memcpy2D copyParam;
|
|
memset(©Param, 0, sizeof(copyParam));
|
|
copyParam.dstMemoryType = hipMemoryTypeArray;
|
|
copyParam.dstArray = array;
|
|
copyParam.srcMemoryType = hipMemoryTypeHost;
|
|
copyParam.srcHost = hData;
|
|
copyParam.srcPitch = width * sizeof(T);
|
|
copyParam.WidthInBytes = copyParam.srcPitch;
|
|
copyParam.Height = height;
|
|
HIP_CHECK(hipMemcpyParam2D(©Param));
|
|
|
|
textureReference *texref;
|
|
HIP_CHECK(hipModuleGetTexRef(&texref, module, refName));
|
|
HIP_CHECK(hipTexRefSetAddressMode(texref, 0, hipAddressModeClamp));
|
|
HIP_CHECK(hipTexRefSetAddressMode(texref, 1, hipAddressModeClamp));
|
|
HIP_CHECK(hipTexRefSetFilterMode(texref, hipFilterModePoint));
|
|
HIP_CHECK(hipTexRefSetFlags(texref, HIP_TRSF_READ_AS_INTEGER));
|
|
HIP_CHECK(hipTexRefSetFormat(texref, format, channels));
|
|
HIP_CHECK(hipTexRefSetArray(texref, array, HIP_TRSA_OVERRIDE_FORMAT));
|
|
|
|
T *dData = NULL;
|
|
HIP_CHECK(hipMalloc((void** )&dData, size));
|
|
|
|
struct {
|
|
void *_Ad;
|
|
unsigned int _Bd;
|
|
unsigned int _Cd;
|
|
} args;
|
|
args._Ad = (void*) dData;
|
|
args._Bd = width;
|
|
args._Cd = height;
|
|
|
|
size_t sizeTemp = sizeof(args);
|
|
|
|
void *config[] = { HIP_LAUNCH_PARAM_BUFFER_POINTER, &args,
|
|
HIP_LAUNCH_PARAM_BUFFER_SIZE, &sizeTemp, HIP_LAUNCH_PARAM_END };
|
|
|
|
hipFunction_t Function;
|
|
HIP_CHECK(hipModuleGetFunction(&Function, module, funcName));
|
|
|
|
int temp1 = width / 16;
|
|
int temp2 = height / 16;
|
|
HIP_CHECK(
|
|
hipModuleLaunchKernel(Function, 16, 16, 1, temp1, temp2, 1, 0, 0, NULL,
|
|
(void** )&config));
|
|
hipDeviceSynchronize();
|
|
|
|
T *hOutputData = (T*) malloc(size);
|
|
memset(hOutputData, 0, size);
|
|
HIP_CHECK(hipMemcpy(hOutputData, dData, size, hipMemcpyDeviceToHost));
|
|
|
|
for (int i = 0; i < height; i++) {
|
|
for (int j = 0; j < width; j++) {
|
|
if (hData[i * width + j] != hOutputData[i * width + j]) {
|
|
printDiff<T>(i, j, hData[i * width + j], hOutputData[i * width + j]);
|
|
testResult = false;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
HIP_CHECK(hipUnbindTexture(texref));
|
|
HIP_CHECK(hipFree(dData));
|
|
HIP_CHECK(hipFreeArray(array));
|
|
free(hOutputData);
|
|
free(hData);
|
|
printf("%s test %s ...\n", funcName, testResult ? "PASSED" : "FAILED");
|
|
return testResult;
|
|
}
|
|
|
|
inline bool isImageSupported() {
|
|
int imageSupport = 1;
|
|
#ifdef __HIP_PLATFORM_AMD__
|
|
HIP_CHECK(hipDeviceGetAttribute(&imageSupport, hipDeviceAttributeImageSupport,
|
|
0));
|
|
#endif
|
|
return imageSupport != 0;
|
|
}
|
|
|
|
int main(int argc, char** argv) {
|
|
if (!isImageSupported()) {
|
|
printf("Texture is not support on the device. Skipped.\n");
|
|
return 0;
|
|
}
|
|
hipInit(0);
|
|
hipModule_t module;
|
|
HIP_CHECK(hipModuleLoad(&module, fileName));
|
|
testResult = testResult && runTest<char>(module, "texChar", "tex2dKernelChar");
|
|
testResult = testResult && runTest<short>(module, "texShort", "tex2dKernelShort");
|
|
testResult = testResult && runTest<int>(module, "texInt", "tex2dKernelInt");
|
|
testResult = testResult && runTest<float>(module, "texFloat", "tex2dKernelFloat");
|
|
testResult = testResult && runTest<char4>(module, "texChar4", "tex2dKernelChar4");
|
|
testResult = testResult && runTest<short4>(module, "texShort4", "tex2dKernelShort4");
|
|
testResult = testResult && runTest<int4>(module, "texInt4", "tex2dKernelInt4");
|
|
testResult = testResult && runTest<float4>(module, "texFloat4", "tex2dKernelFloat4");
|
|
|
|
HIP_CHECK(hipModuleUnload(module));
|
|
printf("texture2dDrv %s ...\n", testResult ? "PASSED" : "FAILED");
|
|
return testResult ? EXIT_SUCCESS : EXIT_FAILURE;
|
|
}
|