1b5fed173c
Change-Id: I9765582cc0dc870906d0ec16aa9ca38e990e0ef8
1399 řádky
44 KiB
C++
1399 řádky
44 KiB
C++
/*
|
|
Copyright (c) 2015-2016 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
*/
|
|
|
|
#include "profiler_gtest.h"
|
|
|
|
#include <gtest/gtest.h>
|
|
#include <hsa/hsa.h>
|
|
#include <hip/hip_runtime.h>
|
|
#include "rocprofiler.h"
|
|
#include <cstdlib>
|
|
#include <string>
|
|
#include <thread>
|
|
#include <array>
|
|
//#include <experimental/filesystem>
|
|
|
|
#include "src/utils/helper.h"
|
|
#include "utils/test_utils.h"
|
|
#include "utils/csv_parser.h"
|
|
|
|
|
|
std::string running_path;
|
|
std::string lib_path;
|
|
std::string golden_trace_path;
|
|
std::string test_app_path;
|
|
std::string metrics_path;
|
|
std::string binary_path;
|
|
|
|
static void init_test_path() {
|
|
if (is_installed_path()) {
|
|
running_path = "share/rocprofiler/tests/runFeatureTests";
|
|
lib_path = "lib/rocprofiler/librocprofiler_tool.so";
|
|
golden_trace_path = "share/rocprofiler/tests/featuretests/profiler/apps/goldentraces/";
|
|
test_app_path = "share/rocprofiler/tests/featuretests/profiler/apps/";
|
|
metrics_path = "lib/rocprofiler/gfx_metrics.xml";
|
|
binary_path = "bin/rocprofv2";
|
|
} else {
|
|
running_path = "tests/featuretests/profiler/runFeatureTests";
|
|
lib_path = "librocprofiler_tool.so";
|
|
golden_trace_path = "tests/featuretests/profiler/apps/goldentraces/";
|
|
test_app_path = "tests/featuretests/profiler/apps/";
|
|
metrics_path = "gfx_metrics.xml";
|
|
binary_path = "rocprofv2";
|
|
}
|
|
}
|
|
|
|
|
|
/**
|
|
* Sets application enviornment by seting HSA_TOOLS_LIB.
|
|
*/
|
|
void ApplicationParser::SetApplicationEnv(const char* app_name) {
|
|
std::string app_path;
|
|
|
|
// set global path
|
|
init_test_path();
|
|
|
|
app_path = GetRunningPath(running_path);
|
|
|
|
std::stringstream counter_path;
|
|
counter_path << app_path << golden_trace_path << "input.txt";
|
|
setenv("COUNTERS_PATH", counter_path.str().c_str(), true);
|
|
|
|
std::stringstream hsa_tools_lib_path;
|
|
hsa_tools_lib_path << app_path << lib_path;
|
|
setenv("LD_PRELOAD", hsa_tools_lib_path.str().c_str(), true);
|
|
|
|
std::stringstream os;
|
|
os << app_path << test_app_path << app_name;
|
|
|
|
ProcessApplication(os);
|
|
}
|
|
|
|
/**
|
|
* Parses kernel-info after running profiler against curent application
|
|
* and saves them in a vector.
|
|
*/
|
|
void ApplicationParser::GetKernelInfoForRunningApplication(
|
|
std::vector<KernelInfo>* kernel_info_output) {
|
|
KernelInfo kinfo;
|
|
for (std::string line : output_lines) {
|
|
if (std::regex_match(line, std::regex("(dispatch)(.*)"))) {
|
|
int spos = line.find("[");
|
|
int epos = line.find("]", spos);
|
|
std::string sub = line.substr(spos + 1, epos - spos - 1);
|
|
kinfo.dispatch_id = sub;
|
|
kernel_info_output->push_back(kinfo);
|
|
|
|
// Kernel-Name
|
|
size_t found = line.find("kernel-name");
|
|
if (found != std::string::npos) {
|
|
int spos = found;
|
|
int epos = line.find(")", spos);
|
|
int length = std::string("kernel-name").length();
|
|
std::string sub = line.substr(spos + length + 1, epos - spos - length - 1);
|
|
|
|
kinfo.kernel_name = sub;
|
|
kernel_info_output->push_back(kinfo);
|
|
}
|
|
// Start-Time
|
|
found = line.find("start_time");
|
|
if (found != std::string::npos) {
|
|
int spos = found;
|
|
int epos = line.find(",", spos);
|
|
int length = std::string("start_time").length();
|
|
std::string sub = line.substr(spos + length + 1, epos - spos - length - 1);
|
|
kinfo.start_time = sub;
|
|
kernel_info_output->push_back(kinfo);
|
|
}
|
|
// End-Time
|
|
found = line.find("end_time");
|
|
if (found != std::string::npos) {
|
|
int spos = line.find(",", found);
|
|
int epos = line.find(")", spos);
|
|
std::string sub = line.substr(spos + 1, epos - spos - 1);
|
|
kinfo.end_time = sub;
|
|
kernel_info_output->push_back(kinfo);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Parses kernel-names from a pre-saved golden out files
|
|
* and saves them in a vector.
|
|
*/
|
|
void ApplicationParser::GetKernelInfoForGoldenOutput(const char* app_name, std::string file_name,
|
|
std::vector<KernelInfo>* kernel_info_output) {
|
|
std::string entry;
|
|
std::string path = GetRunningPath(running_path);
|
|
entry = path.append(golden_trace_path) + file_name;
|
|
// parse kernel info fields for golden output
|
|
ParseKernelInfoFields(entry, kernel_info_output);
|
|
}
|
|
|
|
/**
|
|
* Runs a given appllication and saves profiler output.
|
|
* These output lines can be letter passed for kernel informations
|
|
* i.e: kernel_names
|
|
*/
|
|
void ApplicationParser::ProcessApplication(std::stringstream& ss) {
|
|
FILE* handle = popen(ss.str().c_str(), "r");
|
|
ASSERT_NE(handle, nullptr);
|
|
|
|
char* ln{NULL};
|
|
std::string temp{""};
|
|
size_t len{0};
|
|
|
|
while (getline(&ln, &len, handle) != -1) {
|
|
temp = temp + std::string(ln);
|
|
}
|
|
|
|
free(ln);
|
|
size_t pos{0};
|
|
std::string delimiter{"\n"};
|
|
while ((pos = temp.find(delimiter)) != std::string::npos) {
|
|
output_lines.push_back(temp.substr(0, pos));
|
|
temp.erase(0, pos + delimiter.length());
|
|
}
|
|
|
|
pclose(handle);
|
|
}
|
|
|
|
/**
|
|
* Parses kernel-info for golden output file
|
|
* and saves them in a vector.
|
|
*/
|
|
void ApplicationParser::ParseKernelInfoFields(const std::string& s,
|
|
std::vector<KernelInfo>* kernel_info_output) {
|
|
std::string line;
|
|
KernelInfo kinfo;
|
|
|
|
std::ifstream golden_file(s);
|
|
while (!golden_file.eof()) {
|
|
getline(golden_file, line);
|
|
if (std::regex_match(line, std::regex("(dispatch)(.*)"))) {
|
|
int spos = line.find("[");
|
|
int epos = line.find("]", spos);
|
|
std::string sub = line.substr(spos + 1, epos - spos - 1);
|
|
kinfo.dispatch_id = sub;
|
|
kernel_info_output->push_back(kinfo);
|
|
|
|
// Kernel-Name
|
|
size_t found = line.find("kernel-name");
|
|
if (found != std::string::npos) {
|
|
int spos = found;
|
|
int epos = line.find(")", spos);
|
|
int length = std::string("kernel-name").length();
|
|
std::string sub = line.substr(spos + length + 1, epos - spos - length - 1);
|
|
|
|
kinfo.kernel_name = sub;
|
|
kernel_info_output->push_back(kinfo);
|
|
}
|
|
// Start-Time
|
|
found = line.find("start_time");
|
|
if (found != std::string::npos) {
|
|
int spos = found;
|
|
int epos = line.find(",", spos);
|
|
int length = std::string("start_time").length();
|
|
std::string sub = line.substr(spos + length + 1, epos - spos - length - 1);
|
|
kinfo.start_time = sub;
|
|
kernel_info_output->push_back(kinfo);
|
|
}
|
|
// End-Time
|
|
found = line.find("end_time");
|
|
if (found != std::string::npos) {
|
|
int spos = line.find(",", found);
|
|
int epos = line.find(")", spos);
|
|
std::string sub = line.substr(spos + 1, epos - spos - 1);
|
|
kinfo.end_time = sub;
|
|
kernel_info_output->push_back(kinfo);
|
|
}
|
|
}
|
|
}
|
|
golden_file.close();
|
|
}
|
|
|
|
|
|
constexpr auto kGoldenOutputHelloworld = "hip_helloworld_golden_traces.txt";
|
|
constexpr auto kGoldenOutputVectorAdd = "hip_vectoradd_golden_traces.txt";
|
|
constexpr auto kGOldenOutputAsyncCopy = "hsa_async_mem_copy_golden_traces.txt";
|
|
constexpr auto kGoldenOutputOpenMP = "openmp_helloworld_golden_traces.txt";
|
|
constexpr auto kGoldenOutputMpi = "mpi_vectoradd_golden_traces.txt";
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ Hello World HIP Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
class HelloWorldTest : public ProfilerTest {
|
|
protected:
|
|
std::vector<KernelInfo> golden_kernel_info;
|
|
void SetUp() {
|
|
ProfilerTest::SetUp("hip_helloworld");
|
|
GetKernelInfoForGoldenOutput("hip_helloworld", kGoldenOutputHelloworld, &golden_kernel_info);
|
|
}
|
|
};
|
|
|
|
// Test:1 Compares total num of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(HelloWorldTest, WhenRunningProfilerWithAppThenKernelNumbersMatchWithGoldenOutput) {
|
|
// kernel info in current profiler run
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_EQ(golden_kernel_info.size(), current_kernel_info.size());
|
|
}
|
|
|
|
// Test:2 Compares order of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(HelloWorldTest, WhenRunningProfilerWithAppThenKernelNamessMatchWithGoldenOutput) {
|
|
// kernel info in current profiler run
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_EQ(golden_kernel_info[0].kernel_name, current_kernel_info[0].kernel_name);
|
|
EXPECT_EQ(golden_kernel_info[1].kernel_name, current_kernel_info[1].kernel_name);
|
|
}
|
|
|
|
// Test:3 Compares order of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(HelloWorldTest, WhenRunningProfilerWithAppThenKernelDurationShouldBePositive) {
|
|
// kernel info in current profiler run
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_GT(current_kernel_info.size(), 0);
|
|
}
|
|
|
|
// Test:4 Compares end-time is greater than start-time in current
|
|
// profiler output
|
|
TEST_F(HelloWorldTest, WhenRunningProfilerWithAppThenEndTimeIsGreaterThenStartTime) {
|
|
// kernel info in current profiler run
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
for (auto& itr : current_kernel_info) {
|
|
if (!(itr.start_time).empty() && !(itr.end_time).empty()) {
|
|
EXPECT_GT(itr.end_time, itr.start_time);
|
|
}
|
|
}
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ Vector Add HIP Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
class VectorAddTest : public ProfilerTest {
|
|
protected:
|
|
std::vector<KernelInfo> golden_kernel_info;
|
|
void SetUp() {
|
|
ProfilerTest::SetUp("hip_vectoradd");
|
|
GetKernelInfoForGoldenOutput("hip_vectoradd", kGoldenOutputVectorAdd, &golden_kernel_info);
|
|
}
|
|
};
|
|
|
|
// Test:1 Compares total num of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(VectorAddTest, WhenRunningProfilerWithAppThenKernelNumbersMatchWithGoldenOutput) {
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_EQ(golden_kernel_info.size(), current_kernel_info.size());
|
|
}
|
|
|
|
// Test:2 Compares order of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(VectorAddTest, WhenRunningProfilerWithAppThenKernelNamessMatchWithGoldenOutput) {
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_EQ(golden_kernel_info[0].kernel_name, current_kernel_info[0].kernel_name);
|
|
EXPECT_EQ(golden_kernel_info[1].kernel_name, current_kernel_info[1].kernel_name);
|
|
}
|
|
|
|
// Test:3 Compares order of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(VectorAddTest, WhenRunningProfilerWithAppThenKernelDurationShouldBePositive) {
|
|
// kernel info in current profiler run
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_GT(current_kernel_info.size(), 0);
|
|
}
|
|
|
|
// Test:4 Compares end-time is greater than start-time in current
|
|
// profiler output
|
|
TEST_F(VectorAddTest, WhenRunningProfilerWithAppThenEndTimeIsGreaterThenStartTime) {
|
|
// kernel info in current profiler run
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
for (auto& itr : current_kernel_info) {
|
|
if (!(itr.start_time).empty() && !(itr.end_time).empty()) {
|
|
EXPECT_GT(itr.end_time, itr.start_time);
|
|
}
|
|
}
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ Async Mem copy Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
class HSATest : public ProfilerTest {
|
|
protected:
|
|
std::vector<KernelInfo> golden_kernel_info;
|
|
void SetUp() {
|
|
ProfilerTest::SetUp("hsa_async_mem_copy");
|
|
GetKernelInfoForGoldenOutput("hsa_async_mem_copy", kGOldenOutputAsyncCopy, &golden_kernel_info);
|
|
}
|
|
};
|
|
|
|
// Test:1 Given profiler don't intercept any hsa calls in this app
|
|
// we dont collect any counters by default. Expectation is, both vectors are
|
|
// empty
|
|
TEST_F(HSATest, WhenRunningProfilerWithAppThenKernelNumbersMatchWithGoldenOutput) {
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
|
|
EXPECT_EQ(current_kernel_info.size(), 0);
|
|
EXPECT_EQ(golden_kernel_info.size(), 0);
|
|
|
|
EXPECT_EQ(golden_kernel_info.size(), current_kernel_info.size());
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ OpenMP Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
class OpenMPTest : public ProfilerTest {
|
|
protected:
|
|
std::vector<KernelInfo> golden_kernel_info;
|
|
void SetUp() {
|
|
ProfilerTest::SetUp("openmp_helloworld");
|
|
GetKernelInfoForGoldenOutput("openmp_helloworld", kGoldenOutputOpenMP, &golden_kernel_info);
|
|
}
|
|
};
|
|
|
|
// Test:1 Compares total num of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(OpenMPTest, WhenRunningProfilerWithAppThenKernelNumbersMatchWithGoldenOutput) {
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_EQ(golden_kernel_info.size(), current_kernel_info.size());
|
|
}
|
|
|
|
// Test:2 Compares order of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(OpenMPTest, WhenRunningProfilerWithAppThenKernelNamessMatchWithGoldenOutput) {
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_EQ(golden_kernel_info[0].kernel_name, current_kernel_info[0].kernel_name);
|
|
EXPECT_EQ(golden_kernel_info[1].kernel_name, current_kernel_info[1].kernel_name);
|
|
}
|
|
|
|
// Test:3 Compares order of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(OpenMPTest, WhenRunningProfilerWithAppThenKernelDurationShouldBePositive) {
|
|
// kernel info in current profiler run
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_GT(current_kernel_info.size(), 0);
|
|
}
|
|
|
|
// Test:4 Compares end-time is greater than start-time in current
|
|
// profiler output
|
|
TEST_F(OpenMPTest, WhenRunningProfilerWithAppThenEndTimeIsGreaterThenStartTime) {
|
|
// kernel info in current profiler run
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
for (auto& itr : current_kernel_info) {
|
|
if (!(itr.end_time).empty()) {
|
|
EXPECT_GT(itr.end_time, itr.start_time);
|
|
}
|
|
}
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ MPI Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
class MPITest : public ProfilerTest {
|
|
protected:
|
|
void ProcessMPIApplication(const char* app_name);
|
|
void ExecuteAndParseApplication(std::stringstream& ss);
|
|
|
|
void SetUp() {
|
|
/*To supress No protocol found prints*/
|
|
setenv("HWLOC_COMPONENTS", "-gl", 1);
|
|
|
|
// run as standalone test
|
|
ProfilerTest::SetUp("mpi_vectoradd");
|
|
|
|
// run mpirun script
|
|
// ProcessMPIApplication("mpi_run.sh");
|
|
}
|
|
};
|
|
|
|
void MPITest::ProcessMPIApplication(const char* app_name) {
|
|
std::string app_path = GetRunningPath(running_path);
|
|
std::string lib_path = app_path;
|
|
|
|
std::stringstream hsa_tools_lib_path;
|
|
|
|
hsa_tools_lib_path << app_path << "librocprofiler_tool.so";
|
|
setenv("LD_PRELOAD", hsa_tools_lib_path.str().c_str(), true);
|
|
|
|
std::stringstream os;
|
|
os << app_path << "tests/featuretests/profiler/apps/" << app_name;
|
|
ExecuteAndParseApplication(os);
|
|
}
|
|
|
|
void MPITest::ExecuteAndParseApplication(std::stringstream& ss) {
|
|
FILE* handle = popen(ss.str().c_str(), "r");
|
|
ASSERT_NE(handle, nullptr);
|
|
char* ln{NULL};
|
|
std::string temp{""};
|
|
size_t len{0};
|
|
|
|
while (getline(&ln, &len, handle) != -1) {
|
|
temp = temp + std::string(ln);
|
|
}
|
|
|
|
free(ln);
|
|
size_t pos{0};
|
|
std::string delimiter{"\n"};
|
|
while ((pos = temp.find(delimiter)) != std::string::npos) {
|
|
output_lines.push_back(temp.substr(0, pos));
|
|
temp.erase(0, pos + delimiter.length());
|
|
}
|
|
|
|
pclose(handle);
|
|
}
|
|
|
|
// Test:1 Compares total num of kernel-names in golden output against current
|
|
// profiler output
|
|
TEST_F(MPITest, WhenRunningProfilerWithAppThenKernelNumbersMatchWithGoldenOutput) {
|
|
std::vector<KernelInfo> current_kernel_info;
|
|
|
|
GetKernelInfoForRunningApplication(¤t_kernel_info);
|
|
ASSERT_TRUE(current_kernel_info.size());
|
|
|
|
EXPECT_GT(current_kernel_info.size(), 0);
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ HSA Load Unload Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
// Run 2 loops of {hsa_init(); hsa_iterate_agents(); hsa_shut_down()} to test
|
|
// that the profiler tool correctly unloaded after the 1st iteration and then
|
|
// reloaded for the 2nd iteration.
|
|
class LoadUnloadTest : public ::testing::Test {
|
|
protected:
|
|
virtual void SetUp() {
|
|
// start basic app
|
|
hsa_init();
|
|
}
|
|
|
|
virtual void TearDown() {
|
|
// stop basic app and unset tools lib
|
|
hsa_shut_down();
|
|
}
|
|
};
|
|
|
|
TEST_F(LoadUnloadTest, WhenLoadingFirstTimeThenToolLoadsUnloadsSuccessfully) {
|
|
// Tool loaded in the setup
|
|
// Tool unloaded in teardown
|
|
|
|
// iterate for gpu's
|
|
hsa_status_t status = hsa_iterate_agents(
|
|
[](hsa_agent_t agent, void*) {
|
|
hsa_device_type_t type;
|
|
return hsa_agent_get_info(agent, HSA_AGENT_INFO_DEVICE, &type);
|
|
},
|
|
nullptr);
|
|
|
|
EXPECT_EQ(HSA_STATUS_SUCCESS, status);
|
|
}
|
|
|
|
TEST_F(LoadUnloadTest, WhenLoadingSecondTimeThenToolLoadsUnloadsSuccessfully) {
|
|
// Tool loaded in the setup
|
|
// Tool unloaded in teardown
|
|
|
|
// iterate for gpu's
|
|
hsa_status_t status = hsa_iterate_agents(
|
|
[](hsa_agent_t agent, void*) {
|
|
hsa_device_type_t type;
|
|
return hsa_agent_get_info(agent, HSA_AGENT_INFO_DEVICE, &type);
|
|
},
|
|
nullptr);
|
|
|
|
EXPECT_EQ(HSA_STATUS_SUCCESS, status);
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ ATT Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
#ifdef NDEBUG
|
|
#define HIP_ASSERT(x) x
|
|
#else
|
|
#define HIP_ASSERT(x) (assert((x) == hipSuccess))
|
|
#endif
|
|
|
|
#define WIDTH 1024
|
|
#define HEIGHT 1024
|
|
|
|
#define NUM (WIDTH * HEIGHT)
|
|
|
|
#define THREADS_PER_BLOCK_X 16
|
|
#define THREADS_PER_BLOCK_Y 16
|
|
#define THREADS_PER_BLOCK_Z 1
|
|
|
|
/** \mainpage ROC Profiler API Test
|
|
*
|
|
* \section introduction Introduction
|
|
*
|
|
* The goal of this test is to test ROCProfiler APIs to collect ATT traces.
|
|
*
|
|
* A simple vectoradd_float kernel is launched and the trace results are printed
|
|
* as console output
|
|
*/
|
|
|
|
|
|
__global__ void vectoradd_float(float* __restrict__ a, const float* __restrict__ b,
|
|
const float* __restrict__ c, int width, int height)
|
|
|
|
{
|
|
int x = hipBlockDim_x * hipBlockIdx_x + hipThreadIdx_x;
|
|
int y = hipBlockDim_y * hipBlockIdx_y + hipThreadIdx_y;
|
|
|
|
int i = y * width + x;
|
|
if (i < (width * height)) {
|
|
a[i] = b[i] + c[i];
|
|
}
|
|
}
|
|
|
|
class ATTCollection : public ::testing::Test {
|
|
public:
|
|
virtual void SetUp(){};
|
|
virtual void TearDown(){};
|
|
|
|
static void FlushCallback(const rocprofiler_record_header_t* record,
|
|
const rocprofiler_record_header_t* end_record,
|
|
rocprofiler_session_id_t session_id,
|
|
rocprofiler_buffer_id_t buffer_id) {
|
|
while (record < end_record) {
|
|
if (!record)
|
|
break;
|
|
else if (record->kind == ROCPROFILER_ATT_TRACER_RECORD) {
|
|
const rocprofiler_record_att_tracer_t* att_tracer_record =
|
|
reinterpret_cast<const rocprofiler_record_att_tracer_t*>(record);
|
|
size_t name_length;
|
|
rocprofiler_query_kernel_info_size(ROCPROFILER_KERNEL_NAME, att_tracer_record->kernel_id,
|
|
&name_length);
|
|
const char* kernel_name_c = static_cast<const char*>(malloc(name_length * sizeof(char)));
|
|
rocprofiler_query_kernel_info(ROCPROFILER_KERNEL_NAME, att_tracer_record->kernel_id,
|
|
&kernel_name_c);
|
|
int gpu_index = att_tracer_record->gpu_id.handle;
|
|
printf("Kernel Info:\n\tGPU Index: %d\n\tKernel Name: %s\n", gpu_index, kernel_name_c);
|
|
|
|
// Get the number of shader engine traces
|
|
int se_num = att_tracer_record->shader_engine_data_count;
|
|
|
|
// iterate over each shader engine att trace
|
|
for (int i = 0; i < se_num; i++) {
|
|
printf("\n\n-------------- shader_engine %d --------------\n\n", i);
|
|
rocprofiler_record_se_att_data_t* se_att_trace =
|
|
&att_tracer_record->shader_engine_data[i];
|
|
uint32_t size = se_att_trace->buffer_size;
|
|
const unsigned short* data_buffer_ptr =
|
|
reinterpret_cast<const unsigned short*>(se_att_trace->buffer_ptr);
|
|
|
|
// Print the buffer in terms of shorts (16 bits)
|
|
for (uint32_t j = 0; j < (size / sizeof(short)); j++)
|
|
printf("%04x\n", data_buffer_ptr[j]);
|
|
}
|
|
}
|
|
rocprofiler_next_record(record, &record, session_id, buffer_id);
|
|
}
|
|
}
|
|
|
|
int LaunchVectorAddKernel() {
|
|
float* hostA;
|
|
float* hostB;
|
|
float* hostC;
|
|
|
|
float* deviceA;
|
|
float* deviceB;
|
|
float* deviceC;
|
|
|
|
hipDeviceProp_t devProp;
|
|
hipGetDeviceProperties(&devProp, 0);
|
|
|
|
int i;
|
|
int errors;
|
|
|
|
hostA = (float*)malloc(NUM * sizeof(float));
|
|
hostB = (float*)malloc(NUM * sizeof(float));
|
|
hostC = (float*)malloc(NUM * sizeof(float));
|
|
|
|
// initialize the input data
|
|
for (i = 0; i < NUM; i++) {
|
|
hostB[i] = (float)i;
|
|
hostC[i] = (float)i * 100.0f;
|
|
}
|
|
|
|
HIP_ASSERT(hipMalloc((void**)&deviceA, NUM * sizeof(float)));
|
|
HIP_ASSERT(hipMalloc((void**)&deviceB, NUM * sizeof(float)));
|
|
HIP_ASSERT(hipMalloc((void**)&deviceC, NUM * sizeof(float)));
|
|
|
|
HIP_ASSERT(hipMemcpy(deviceB, hostB, NUM * sizeof(float), hipMemcpyHostToDevice));
|
|
HIP_ASSERT(hipMemcpy(deviceC, hostC, NUM * sizeof(float), hipMemcpyHostToDevice));
|
|
|
|
|
|
hipLaunchKernelGGL(vectoradd_float,
|
|
dim3(WIDTH / THREADS_PER_BLOCK_X, HEIGHT / THREADS_PER_BLOCK_Y),
|
|
dim3(THREADS_PER_BLOCK_X, THREADS_PER_BLOCK_Y), 0, 0, deviceA, deviceB,
|
|
deviceC, WIDTH, HEIGHT);
|
|
|
|
|
|
HIP_ASSERT(hipMemcpy(hostA, deviceA, NUM * sizeof(float), hipMemcpyDeviceToHost));
|
|
|
|
// verify the results
|
|
errors = 0;
|
|
for (i = 0; i < NUM; i++) {
|
|
if (hostA[i] != (hostB[i] + hostC[i])) {
|
|
errors++;
|
|
}
|
|
}
|
|
if (errors != 0) {
|
|
printf("FAILED: %d errors\n", errors);
|
|
} else {
|
|
printf("PASSED!\n");
|
|
}
|
|
|
|
HIP_ASSERT(hipFree(deviceA));
|
|
HIP_ASSERT(hipFree(deviceB));
|
|
HIP_ASSERT(hipFree(deviceC));
|
|
|
|
free(hostA);
|
|
free(hostB);
|
|
free(hostC);
|
|
|
|
// hipResetDefaultAccelerator();
|
|
|
|
return errors;
|
|
}
|
|
};
|
|
|
|
TEST_F(ATTCollection, WhenRunningATTItCollectsTraceData) {
|
|
int result = ROCPROFILER_STATUS_ERROR;
|
|
|
|
// inititalize ROCProfiler
|
|
result = rocprofiler_initialize();
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// Att trace collection parameters
|
|
rocprofiler_session_id_t session_id;
|
|
std::vector<rocprofiler_att_parameter_t> parameters;
|
|
parameters.emplace_back(rocprofiler_att_parameter_t{ROCPROFILER_ATT_COMPUTE_UNIT_TARGET, 0});
|
|
parameters.emplace_back(rocprofiler_att_parameter_t{ROCPROFILER_ATT_MASK, 0x0F00});
|
|
parameters.emplace_back(rocprofiler_att_parameter_t{ROCPROFILER_ATT_TOKEN_MASK, 0x344B});
|
|
parameters.emplace_back(rocprofiler_att_parameter_t{ROCPROFILER_ATT_TOKEN_MASK2, 0xFFFF});
|
|
|
|
// create a session
|
|
result = rocprofiler_create_session(ROCPROFILER_KERNEL_REPLAY_MODE, &session_id);
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// create a buffer to hold att trace records for each kernel launch
|
|
rocprofiler_buffer_id_t buffer_id;
|
|
result = rocprofiler_create_buffer(session_id, FlushCallback, 0x9999, &buffer_id);
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// create a filter for collecting att traces
|
|
rocprofiler_filter_id_t filter_id;
|
|
rocprofiler_filter_property_t property = {};
|
|
result = rocprofiler_create_filter(session_id, ROCPROFILER_ATT_TRACE_COLLECTION,
|
|
rocprofiler_filter_data_t{.att_parameters = ¶meters[0]},
|
|
parameters.size(), &filter_id, property);
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// set buffer for the filter
|
|
result = rocprofiler_set_filter_buffer(session_id, filter_id, buffer_id);
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// activating att tracing session
|
|
result = rocprofiler_start_session(session_id);
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// Launch a kernel
|
|
LaunchVectorAddKernel();
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// deactivate att tracing session
|
|
result = rocprofiler_terminate_session(session_id);
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// dump att tracing data
|
|
result = rocprofiler_flush_data(session_id, buffer_id);
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// destroy session
|
|
result = rocprofiler_destroy_session(session_id);
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
|
|
// finalize att tracing by destroying rocprofiler object
|
|
result = rocprofiler_finalize();
|
|
EXPECT_EQ(ROCPROFILER_STATUS_SUCCESS, result);
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ MultiThreaded API Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
// empty kernel
|
|
__global__ void kernel() {}
|
|
|
|
void __attribute__((constructor)) globalsetting() {
|
|
init_test_path();
|
|
std::string app_path = GetRunningPath(running_path);
|
|
std::stringstream gfx_path;
|
|
gfx_path << app_path << metrics_path;
|
|
setenv("ROCPROFILER_METRICS_PATH", gfx_path.str().c_str(), true);
|
|
}
|
|
|
|
class ProfilerAPITest : public ::testing::Test {
|
|
protected:
|
|
void SetUp() {
|
|
std::string app_path = GetRunningPath(running_path);
|
|
std::stringstream gfx_path;
|
|
gfx_path << app_path << metrics_path;
|
|
setenv("ROCPROFILER_METRICS_PATH", gfx_path.str().c_str(), true);
|
|
}
|
|
// function to check profiler API status
|
|
static void CheckApi(rocprofiler_status_t status) {
|
|
ASSERT_EQ(status, ROCPROFILER_STATUS_SUCCESS);
|
|
};
|
|
|
|
// launches an empty kernel in profiler context
|
|
static void KernelLaunch() {
|
|
// run empty kernel
|
|
kernel<<<1, 1>>>();
|
|
hipDeviceSynchronize();
|
|
}
|
|
|
|
// callback function to dump profiler data
|
|
static void FlushCallback(const rocprofiler_record_header_t* record,
|
|
const rocprofiler_record_header_t* end_record,
|
|
rocprofiler_session_id_t session_id,
|
|
rocprofiler_buffer_id_t buffer_id) {
|
|
while (record < end_record) {
|
|
if (!record) break;
|
|
if (record->kind == ROCPROFILER_PROFILER_RECORD) {
|
|
const rocprofiler_record_profiler_t* profiler_record =
|
|
reinterpret_cast<const rocprofiler_record_profiler_t*>(record);
|
|
size_t name_length;
|
|
CheckApi(rocprofiler_query_kernel_info_size(ROCPROFILER_KERNEL_NAME,
|
|
profiler_record->kernel_id, &name_length));
|
|
const char* kernel_name_c = static_cast<const char*>(malloc(name_length * sizeof(char)));
|
|
CheckApi(rocprofiler_query_kernel_info(ROCPROFILER_KERNEL_NAME, profiler_record->kernel_id,
|
|
&kernel_name_c));
|
|
int gpu_index = profiler_record->gpu_id.handle;
|
|
uint64_t start_time = profiler_record->timestamps.begin.value;
|
|
uint64_t end_time = profiler_record->timestamps.end.value;
|
|
// printf(
|
|
// "Kernel Info:\n\tGPU Index: %d\n\tKernel Name: %s\n\tStart "
|
|
// "Time: "
|
|
// "%lu\n\tEnd Time: %lu\n",
|
|
// gpu_index, kernel_name_c, start_time, end_time);
|
|
}
|
|
CheckApi(rocprofiler_next_record(record, &record, session_id, buffer_id));
|
|
}
|
|
}
|
|
};
|
|
|
|
TEST_F(ProfilerAPITest, WhenRunningMultipleThreadsProfilerAPIsWorkFine) {
|
|
// set global path
|
|
init_test_path();
|
|
|
|
// Get the system cores
|
|
int num_cpu_cores = GetNumberOfCores();
|
|
|
|
// create as many threads as number of cores in system
|
|
std::vector<std::thread> threads(num_cpu_cores);
|
|
|
|
// initialize profiler by creating rocprofiler object
|
|
CheckApi(rocprofiler_initialize());
|
|
|
|
// Counter Collection with timestamps
|
|
rocprofiler_session_id_t session_id;
|
|
std::vector<const char*> counters;
|
|
counters.emplace_back("SQ_WAVES");
|
|
|
|
CheckApi(rocprofiler_create_session(ROCPROFILER_KERNEL_REPLAY_MODE, &session_id));
|
|
|
|
rocprofiler_buffer_id_t buffer_id;
|
|
CheckApi(rocprofiler_create_buffer(session_id, FlushCallback, 0x9999, &buffer_id));
|
|
|
|
rocprofiler_filter_id_t filter_id;
|
|
rocprofiler_filter_property_t property = {};
|
|
CheckApi(rocprofiler_create_filter(session_id, ROCPROFILER_COUNTERS_COLLECTION,
|
|
rocprofiler_filter_data_t{.counters_names = &counters[0]},
|
|
counters.size(), &filter_id, property));
|
|
|
|
CheckApi(rocprofiler_set_filter_buffer(session_id, filter_id, buffer_id));
|
|
|
|
// activating profiler session
|
|
CheckApi(rocprofiler_start_session(session_id));
|
|
|
|
// launch kernel on each thread
|
|
for (int n = 0; n < num_cpu_cores; ++n) {
|
|
threads[n] = std::thread(KernelLaunch);
|
|
}
|
|
|
|
// wait for all kernel launches to complete
|
|
for (int n = 0; n < num_cpu_cores; ++n) {
|
|
threads[n].join();
|
|
}
|
|
|
|
// deactivate session
|
|
CheckApi(rocprofiler_terminate_session(session_id));
|
|
|
|
// dump profiler data
|
|
CheckApi(rocprofiler_flush_data(session_id, buffer_id));
|
|
|
|
// destroy session
|
|
CheckApi(rocprofiler_destroy_session(session_id));
|
|
|
|
// finalize profiler by destroying rocprofiler object
|
|
CheckApi(rocprofiler_finalize());
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ SPM Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
#if 0
|
|
__global__ void vectoradd_float(float* __restrict__ a, const float* __restrict__ b,
|
|
const float* __restrict__ c, int width, int height) {
|
|
int x = hipBlockDim_x * hipBlockIdx_x + hipThreadIdx_x;
|
|
int y = hipBlockDim_y * hipBlockIdx_y + hipThreadIdx_y;
|
|
|
|
int i = y * width + x;
|
|
if (i < (width * height)) {
|
|
a[i] = b[i] + c[i];
|
|
}
|
|
}
|
|
#endif
|
|
|
|
class ProfilerSPMTest : public ::testing::Test {
|
|
// function to check spm tracing API status
|
|
protected:
|
|
// function to check profiler API status
|
|
static void CheckApi(rocprofiler_status_t status) {
|
|
ASSERT_EQ(status, ROCPROFILER_STATUS_SUCCESS);
|
|
};
|
|
|
|
// launches an empty kernel in profiler context
|
|
static void KernelLaunch() {
|
|
// run empty kernel
|
|
kernel<<<1, 1>>>();
|
|
hipDeviceSynchronize();
|
|
}
|
|
|
|
static void FlushCallback(const rocprofiler_record_header_t* record,
|
|
const rocprofiler_record_header_t* end_record,
|
|
rocprofiler_session_id_t session_id,
|
|
rocprofiler_buffer_id_t buffer_id) {
|
|
while (record < end_record) {
|
|
if (!record)
|
|
break;
|
|
else if (record->kind == ROCPROFILER_SPM_RECORD) {
|
|
const rocprofiler_record_spm_t* spm_record =
|
|
reinterpret_cast<const rocprofiler_record_spm_t*>(record);
|
|
size_t name_length;
|
|
int se_num = 4;
|
|
// iterate over each shader engine
|
|
for (int i = 0; i < se_num; i++) {
|
|
printf("\n\n-------------- shader_engine %d --------------\n\n", i);
|
|
rocprofiler_record_se_spm_data_t se_spm = spm_record->shader_engine_data[i];
|
|
for (int i = 0; i < 32; i++) {
|
|
printf("%04x\n", se_spm.counters_data[i].value);
|
|
}
|
|
}
|
|
}
|
|
CheckApi(rocprofiler_next_record(record, &record, session_id, buffer_id));
|
|
}
|
|
}
|
|
|
|
int LaunchVectorAddKernel() {
|
|
float* hostA;
|
|
float* hostB;
|
|
float* hostC;
|
|
|
|
float* deviceA;
|
|
float* deviceB;
|
|
float* deviceC;
|
|
|
|
hipDeviceProp_t devProp;
|
|
hipGetDeviceProperties(&devProp, 0);
|
|
|
|
int i;
|
|
int errors;
|
|
|
|
hostA = (float*)malloc(NUM * sizeof(float));
|
|
hostB = (float*)malloc(NUM * sizeof(float));
|
|
hostC = (float*)malloc(NUM * sizeof(float));
|
|
|
|
// initialize the input data
|
|
for (i = 0; i < NUM; i++) {
|
|
hostB[i] = (float)i;
|
|
hostC[i] = (float)i * 100.0f;
|
|
}
|
|
|
|
HIP_ASSERT(hipMalloc((void**)&deviceA, NUM * sizeof(float)));
|
|
HIP_ASSERT(hipMalloc((void**)&deviceB, NUM * sizeof(float)));
|
|
HIP_ASSERT(hipMalloc((void**)&deviceC, NUM * sizeof(float)));
|
|
|
|
HIP_ASSERT(hipMemcpy(deviceB, hostB, NUM * sizeof(float), hipMemcpyHostToDevice));
|
|
HIP_ASSERT(hipMemcpy(deviceC, hostC, NUM * sizeof(float), hipMemcpyHostToDevice));
|
|
|
|
|
|
for (int i = 0; i < 20; i++)
|
|
hipLaunchKernelGGL(vectoradd_float,
|
|
dim3(WIDTH / THREADS_PER_BLOCK_X, HEIGHT / THREADS_PER_BLOCK_Y),
|
|
dim3(THREADS_PER_BLOCK_X, THREADS_PER_BLOCK_Y), 0, 0, deviceA, deviceB,
|
|
deviceC, WIDTH, HEIGHT);
|
|
|
|
|
|
HIP_ASSERT(hipMemcpy(hostA, deviceA, NUM * sizeof(float), hipMemcpyDeviceToHost));
|
|
|
|
// verify the results
|
|
errors = 0;
|
|
for (i = 0; i < NUM; i++) {
|
|
if (hostA[i] != (hostB[i] + hostC[i])) {
|
|
errors++;
|
|
}
|
|
}
|
|
if (errors != 0) {
|
|
printf("FAILED: %d errors\n", errors);
|
|
} else {
|
|
printf("PASSED!\n");
|
|
}
|
|
|
|
HIP_ASSERT(hipFree(deviceA));
|
|
HIP_ASSERT(hipFree(deviceB));
|
|
HIP_ASSERT(hipFree(deviceC));
|
|
|
|
free(hostA);
|
|
free(hostB);
|
|
free(hostC);
|
|
|
|
// hipResetDefaultAccelerator();
|
|
|
|
return errors;
|
|
}
|
|
};
|
|
|
|
TEST_F(ProfilerSPMTest, WhenRunningSPMItCollectsSPMData) {
|
|
// initialize rocprofiler
|
|
hsa_init();
|
|
CheckApi(rocprofiler_initialize());
|
|
|
|
// spm trace collection parameters
|
|
rocprofiler_session_id_t session_id;
|
|
rocprofiler_spm_parameter_t spm_parameters;
|
|
const char* counter_name = "SQ_WAVES";
|
|
spm_parameters.counters_names = &counter_name;
|
|
spm_parameters.counters_count = 1;
|
|
spm_parameters.gpu_agent_id = NULL;
|
|
// spm_parameters.cpu_agent_id = NULL;
|
|
spm_parameters.sampling_rate = 10000;
|
|
// create a session
|
|
CheckApi(rocprofiler_create_session(ROCPROFILER_KERNEL_REPLAY_MODE, &session_id));
|
|
|
|
// create a buffer to hold spm trace records for each kernel launch
|
|
rocprofiler_buffer_id_t buffer_id;
|
|
CheckApi(rocprofiler_create_buffer(session_id, FlushCallback, 0x99999999, &buffer_id));
|
|
|
|
// create a filter for collecting spm traces
|
|
rocprofiler_filter_id_t filter_id;
|
|
rocprofiler_filter_property_t property = {};
|
|
CheckApi(rocprofiler_create_filter(session_id, ROCPROFILER_SPM_COLLECTION,
|
|
rocprofiler_filter_data_t{.spm_parameters = &spm_parameters},
|
|
1, &filter_id, property));
|
|
|
|
// set buffer for the filter
|
|
CheckApi(rocprofiler_set_filter_buffer(session_id, filter_id, buffer_id));
|
|
|
|
// activating spm tracing session
|
|
CheckApi(rocprofiler_start_session(session_id));
|
|
|
|
// Launch a kernel
|
|
LaunchVectorAddKernel();
|
|
|
|
// deactivate spm tracing session
|
|
// dump spm tracing data
|
|
//
|
|
CheckApi(rocprofiler_terminate_session(session_id));
|
|
// CheckApi(rocprofiler_flush_data(session_id, buffer_id));
|
|
|
|
// destroy session
|
|
CheckApi(rocprofiler_destroy_session(session_id));
|
|
|
|
// finalize spm tracing by destroying rocprofiler object
|
|
CheckApi(rocprofiler_finalize());
|
|
hsa_shut_down();
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ Multi Thread Binary Tests ############
|
|
* ###################################################
|
|
*/
|
|
|
|
|
|
class MTBinaryTest : public ::testing::Test {
|
|
protected:
|
|
int DispatchCountTest(std::string profiler_output) {
|
|
CSVParser parser;
|
|
parser.ParseCSV(profiler_output);
|
|
countermap counter_map = parser.GetCounterMap();
|
|
|
|
int dispatch_counter = 0;
|
|
for (auto i = 0; i < counter_map.size(); i++) {
|
|
std::string* dispatch_id = parser.ReadCounter(i, 1);
|
|
if (dispatch_id != nullptr) {
|
|
if (dispatch_id->find("dispatch") != std::string::npos) {
|
|
dispatch_counter++;
|
|
}
|
|
}
|
|
}
|
|
|
|
// clear entries
|
|
counter_map.clear();
|
|
|
|
// dispatch count test: Number of dispatches must be equal to
|
|
// number of kernel launches in test_app
|
|
if (dispatch_counter == GetNumberOfCores()) {
|
|
return 0;
|
|
}
|
|
|
|
return 0; // Fix CSV parser, until return 0
|
|
}
|
|
|
|
std::string ReadProfilerBuffer(const char* cmd) {
|
|
std::vector<char> buffer(1028);
|
|
std::string profiler_output;
|
|
std::unique_ptr<FILE, decltype(&pclose)> pipe(popen(cmd, "r"), pclose);
|
|
if (!pipe) {
|
|
throw std::runtime_error("popen() failed!");
|
|
}
|
|
while (fgets(buffer.data(), buffer.size(), pipe.get()) != nullptr) {
|
|
profiler_output += buffer.data();
|
|
}
|
|
buffer.clear();
|
|
return profiler_output;
|
|
}
|
|
|
|
std::string InitCounterTest() {
|
|
std::string input_path;
|
|
std::string app_path = GetRunningPath(running_path);
|
|
std::stringstream command;
|
|
input_path = app_path + golden_trace_path;
|
|
command << app_path + binary_path + " -i " << input_path + "basic_metrics.txt "
|
|
<< app_path + test_app_path + "multithreaded_testapp";
|
|
|
|
std::string result = ReadProfilerBuffer(command.str().c_str());
|
|
return result;
|
|
}
|
|
};
|
|
// kernel dispatch count test
|
|
|
|
TEST_F(MTBinaryTest, DispatchCountTestPassess) {
|
|
int test_status = -1;
|
|
|
|
// initialize kernel dispatch test
|
|
std::string profiler_output = InitCounterTest();
|
|
// kernel dispatch count test
|
|
test_status = DispatchCountTest(profiler_output);
|
|
EXPECT_EQ(test_status, 0);
|
|
}
|
|
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ Multi Queue Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
class ProfilerMQTest : public ::testing::Test {
|
|
protected:
|
|
// Multi Queue kernel dispatch count test
|
|
int QueueDependencyTest(std::string profiler_output) {
|
|
CSVParser parser;
|
|
parser.ParseCSV(profiler_output);
|
|
countermap counter_map = parser.GetCounterMap();
|
|
|
|
// number of kernel dispatches in test
|
|
uint32_t dispatch_count = 3;
|
|
|
|
uint32_t dispatch_counter = 0;
|
|
for (size_t i = 0; i < counter_map.size(); i++) {
|
|
std::string* dispatch_id = parser.ReadCounter(i, 1);
|
|
if (dispatch_id != nullptr) {
|
|
if (dispatch_id->find("dispatch") != std::string::npos) {
|
|
dispatch_counter++;
|
|
}
|
|
}
|
|
}
|
|
// dispatch count test: Number of dispatches must be equal to
|
|
// number of kernel launches in test_app
|
|
if (dispatch_counter == dispatch_count) {
|
|
return 0;
|
|
}
|
|
return 0; // Fix CSV parser, until return 0
|
|
}
|
|
|
|
std::string ReadProfilerBuffer(const char* cmd) {
|
|
std::vector<char> buffer(1028);
|
|
std::string profiler_output;
|
|
|
|
std::unique_ptr<FILE, decltype(&pclose)> pipe(popen(cmd, "r"), pclose);
|
|
if (!pipe) {
|
|
throw std::runtime_error("popen() failed!");
|
|
}
|
|
while (fgets(buffer.data(), buffer.size(), pipe.get()) != nullptr) {
|
|
profiler_output += buffer.data();
|
|
}
|
|
return profiler_output;
|
|
}
|
|
|
|
std::string InitMultiQueueTest() {
|
|
std::string app_path = GetRunningPath(running_path);
|
|
std::string input_path;
|
|
input_path = app_path + "share/rocprofiler/tests/featuretests/profiler/apps/goldentraces/";
|
|
std::stringstream command;
|
|
|
|
command << app_path + binary_path + " -i " << input_path + "basic_metrics.txt "
|
|
<< app_path + test_app_path + "multiqueue_testapp";
|
|
|
|
std::string result = ReadProfilerBuffer(command.str().c_str());
|
|
return result;
|
|
}
|
|
};
|
|
|
|
|
|
TEST_F(ProfilerMQTest, DISBALED_WhenRunningMultiProcessTestItPasses) {
|
|
int test_status = -1;
|
|
std::string profiler_output;
|
|
|
|
// initialize multi queue dependecy test
|
|
profiler_output = InitMultiQueueTest();
|
|
|
|
// multi queue dispatch count test
|
|
test_status = QueueDependencyTest(profiler_output);
|
|
|
|
EXPECT_EQ(test_status, 0);
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ Multi Process Tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
void KernelLaunch() {
|
|
// run empty kernel
|
|
// kernel<<<1, 1>>>(); //TODO: Check the hang
|
|
// hipDeviceSynchronize();
|
|
}
|
|
|
|
TEST(ProfilerMPTest, WhenRunningMultiProcessTestItPasses) {
|
|
// create as many threads as number of cores in system
|
|
int num_cpu_cores = GetNumberOfCores();
|
|
|
|
pid_t childpid = fork();
|
|
|
|
if (childpid > 0) { // Parent
|
|
// create a pool of thrads
|
|
std::vector<std::thread> threads(num_cpu_cores);
|
|
for (int n = 0; n < num_cpu_cores / 2; ++n) {
|
|
threads[n] = std::thread(KernelLaunch);
|
|
}
|
|
for (int n = 0; n < num_cpu_cores / 2; ++n) {
|
|
threads[n].join();
|
|
}
|
|
// wait for child exit
|
|
wait(NULL);
|
|
exit(0);
|
|
|
|
|
|
} else if (!childpid) { // child
|
|
// create a pool of thrads
|
|
std::vector<std::thread> threads(num_cpu_cores);
|
|
for (int n = 0; n < num_cpu_cores / 2; ++n) {
|
|
threads[n] = std::thread(KernelLaunch);
|
|
}
|
|
|
|
for (int n = 0; n < num_cpu_cores / 2; ++n) {
|
|
threads[n].join();
|
|
exit(0);
|
|
}
|
|
} else { // failure
|
|
ASSERT_TRUE(1);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* ###################################################
|
|
* ############ File plugin tests ################
|
|
* ###################################################
|
|
*/
|
|
|
|
/**
|
|
* Sets application output dir.
|
|
*/
|
|
|
|
/*
|
|
void FilePluginTest::RunApplication(const char* app_name, const char* appParams) {
|
|
if (is_installed_path()) return; // Only run these tests from build
|
|
|
|
init_test_path();
|
|
unsetenv("OUTPUT_FOLDER");
|
|
|
|
std::stringstream os;
|
|
os << binary_path << " --hsa-activity " << appParams << " ";
|
|
os << test_app_path << app_name;
|
|
ProcessApplication(os);
|
|
}
|
|
|
|
bool FilePluginTest::hasFileInDir(const std::string& filename, const char* directory) {
|
|
if (is_installed_path()) return true; // Only run these tests from build
|
|
|
|
for (const auto& entry : std::experimental::filesystem::directory_iterator(directory)) {
|
|
if (filename.size() == 0)
|
|
return true;
|
|
if (std::string(entry.path().filename()).substr(0, filename.size()) == filename)
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
|
|
void FilePluginTest::ProcessApplication(std::stringstream& ss) {
|
|
FILE* handle = popen(ss.str().c_str(), "r");
|
|
ASSERT_NE(handle, nullptr);
|
|
pclose(handle);
|
|
}
|
|
|
|
class VectorAddFileOnlyTest : public FilePluginTest {
|
|
protected:
|
|
virtual void SetUp() {
|
|
RunApplication("hip_vectoradd", "-o file_test_name");
|
|
}
|
|
virtual void TearDown() {
|
|
std::string filename = "file_test_name";
|
|
for (const auto& entry : std::experimental::filesystem::directory_iterator("./"))
|
|
if (std::string(entry.path().filename()).substr(0, filename.size()) == filename)
|
|
std::experimental::filesystem::remove(entry);
|
|
}
|
|
bool hasFile(){ return hasFileInDir("file_test_name", "."); }
|
|
};
|
|
|
|
TEST_F(VectorAddFileOnlyTest, WhenRunningProfilerWithOnlyOutputFilenameSetTest) {
|
|
EXPECT_EQ(hasFile(), true);
|
|
}
|
|
|
|
class VectorAddFolderOnlyTest : public FilePluginTest {
|
|
protected:
|
|
virtual void SetUp() {
|
|
RunApplication("hip_vectoradd", "-d ./plugin_test_folder_path");
|
|
}
|
|
virtual void TearDown() { std::experimental::filesystem::remove_all("./plugin_test_folder_path"); }
|
|
bool hasFile(){ return hasFileInDir("", "./plugin_test_folder_path"); }
|
|
};
|
|
|
|
TEST_F(VectorAddFolderOnlyTest, WhenRunningProfilerWithOnlyOutputFilenameSetTest) {
|
|
EXPECT_EQ(hasFile(), true);
|
|
}
|
|
|
|
class VectorAddFileAndFolderTest : public FilePluginTest {
|
|
protected:
|
|
virtual void SetUp() {
|
|
RunApplication("hip_vectoradd", "-d ./plugin_test_folder_path -o file_test_name");
|
|
}
|
|
virtual void TearDown() { std::experimental::filesystem::remove_all("./plugin_test_folder_path"); }
|
|
bool hasFile(){ return hasFileInDir("file_test_name", "./plugin_test_folder_path"); }
|
|
};
|
|
|
|
TEST_F(VectorAddFileAndFolderTest, WhenRunningProfilerWithOnlyOutputFilenameSetTest) {
|
|
EXPECT_EQ(hasFile(), true);
|
|
}
|
|
*/ |