070b659a9a
* Ensure the clang-tidy is updated + clang-tidy fixes * update-ci workflow * Enable clang-tidy checks * Add extra logging to device counter collection samples * Misc clang-tidy fixes * Disable device counter collection samples for ThreadSanitizer * Formatting --------- Co-authored-by: Jonathan R. Madsen <jonathanrmadsen@gmail.com>
115 строки
3.3 KiB
C++
115 строки
3.3 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
// copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
// SOFTWARE.
|
|
|
|
#include "occupancy.hpp"
|
|
#include <nlohmann/json.hpp>
|
|
#include "outputfile.hpp"
|
|
|
|
#include <atomic>
|
|
#include <fstream>
|
|
#include <iostream>
|
|
#include <sstream>
|
|
|
|
#define OCCUPANCY_RES 8
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace att_wrapper
|
|
{
|
|
namespace
|
|
{
|
|
union occupancy_data_v1
|
|
{
|
|
struct
|
|
{
|
|
uint64_t kernel_id : 12;
|
|
uint64_t simd : 2;
|
|
uint64_t slot : 4;
|
|
uint64_t enable : 1;
|
|
uint64_t cu : 4;
|
|
uint64_t time : 41;
|
|
};
|
|
uint64_t raw;
|
|
};
|
|
|
|
std::map<pcinfo_t, int> kernel_ids{{pcinfo_t{0, 0}, 0}};
|
|
std::atomic<int> current_id{1};
|
|
|
|
int
|
|
get_kernel_id(pcinfo_t pc)
|
|
{
|
|
if(kernel_ids.find(pc) != kernel_ids.end()) return kernel_ids.at(pc);
|
|
|
|
return kernel_ids.emplace(pc, current_id.fetch_add(1)).first->second;
|
|
}
|
|
|
|
uint64_t
|
|
convert(const att_occupancy_info_v2_t& v2)
|
|
{
|
|
occupancy_data_v1 v1{};
|
|
v1.time = v2.time / OCCUPANCY_RES;
|
|
v1.simd = v2.simd;
|
|
v1.slot = v2.slot;
|
|
v1.enable = v2.start;
|
|
v1.cu = v2.cu;
|
|
v1.kernel_id = get_kernel_id(v2.pc);
|
|
return v1.raw;
|
|
}
|
|
} // namespace
|
|
|
|
namespace OccupancyFile
|
|
{
|
|
void
|
|
OccupancyFile(const Fspath& dir,
|
|
std::shared_ptr<AddressTable>& table,
|
|
const std::map<size_t, std::vector<att_occupancy_info_v2_t>>& occ)
|
|
{
|
|
if(!GlobalDefs::get().has_format("json")) return;
|
|
nlohmann::json jocc;
|
|
|
|
for(const auto& [se, eventlist] : occ)
|
|
{
|
|
nlohmann::json list;
|
|
for(const auto& event : eventlist)
|
|
list.push_back(convert(event));
|
|
jocc[std::to_string(se)] = list;
|
|
}
|
|
|
|
for(auto& [pc, id] : kernel_ids)
|
|
{
|
|
std::stringstream ss;
|
|
try
|
|
{
|
|
ss << table->getSymbolMap(pc.marker_id).at(pc.addr).name;
|
|
} catch(std::exception& e)
|
|
{
|
|
ss << pc.marker_id << " / 0x" << std::hex << pc.addr << std::dec;
|
|
}
|
|
jocc["dispatches"][std::to_string(id)] = ss.str();
|
|
}
|
|
|
|
OutputFile(dir / "occupancy.json") << jocc;
|
|
}
|
|
} // namespace OccupancyFile
|
|
} // namespace att_wrapper
|
|
} // namespace rocprofiler
|