// MIT License // // Copyright (c) 2025 Advanced Micro Devices, Inc. All rights reserved. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in all // copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE // SOFTWARE. // [sphinx-start] #include #include #include #include #include #include #define HIP_CHECK(expression) \ { \ const hipError_t status = expression; \ if(status != hipSuccess) \ { \ std::cerr << "HIP error " \ << status << ": " \ << hipGetErrorString(status) \ << " at " << __FILE__ << ":" \ << __LINE__ << std::endl; \ } \ } // Addition of two values. __global__ void add(int *a, int *b, int *c, std::size_t size) { const std::size_t index = threadIdx.x + blockDim.x * blockIdx.x; if(index < size) { c[index] += a[index] + b[index]; } } int main() { constexpr int numOfBlocks = 256; constexpr int threadsPerBlock = 256; constexpr std::size_t arraySize = 1U << 16; std::vector a(arraySize), b(arraySize), c(arraySize); int *d_a, *d_b, *d_c; // Setup input values. std::fill(a.begin(), a.end(), 1); std::fill(b.begin(), b.end(), 2); // Allocate device copies of a, b and c. HIP_CHECK(hipMalloc(&d_a, arraySize * sizeof(int))); HIP_CHECK(hipMalloc(&d_b, arraySize * sizeof(int))); HIP_CHECK(hipMalloc(&d_c, arraySize * sizeof(int))); // Copy input values to device. HIP_CHECK(hipMemcpy(d_a, a.data(), arraySize * sizeof(int), hipMemcpyHostToDevice)); HIP_CHECK(hipMemcpy(d_b, b.data(), arraySize * sizeof(int), hipMemcpyHostToDevice)); // Launch add() kernel on GPU. add<<>>(d_a, d_b, d_c, arraySize); // Check the kernel launch HIP_CHECK(hipGetLastError()); // Check for kernel execution error HIP_CHECK(hipDeviceSynchronize()); // Copy the result back to the host. HIP_CHECK(hipMemcpy(c.data(), d_c, arraySize * sizeof(int), hipMemcpyDeviceToHost)); // Cleanup allocated memory. HIP_CHECK(hipFree(d_a)); HIP_CHECK(hipFree(d_b)); HIP_CHECK(hipFree(d_c)); // Print the result. std::cout << a[0] << " + " << b[0] << " = " << c[0] << std::endl; return EXIT_SUCCESS; } // [sphinx-end]