Файли
rocm-systems/source/lib/rocprofiler-sdk-att/occupancy.cpp
T
Madsen, Jonathan 070b659a9a Re-enable clang-tidy for core workflows + clang-tidy fixes (#197)
* Ensure the clang-tidy is updated + clang-tidy fixes

* update-ci workflow

* Enable clang-tidy checks

* Add extra logging to device counter collection samples

* Misc clang-tidy fixes

* Disable device counter collection samples for ThreadSanitizer

* Formatting

---------

Co-authored-by: Jonathan R. Madsen <jonathanrmadsen@gmail.com>
2025-02-11 10:58:47 -06:00

115 рядки
3.3 KiB
C++

// MIT License
//
// Copyright (c) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in all
// copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
// SOFTWARE.
#include "occupancy.hpp"
#include <nlohmann/json.hpp>
#include "outputfile.hpp"
#include <atomic>
#include <fstream>
#include <iostream>
#include <sstream>
#define OCCUPANCY_RES 8
namespace rocprofiler
{
namespace att_wrapper
{
namespace
{
union occupancy_data_v1
{
struct
{
uint64_t kernel_id : 12;
uint64_t simd : 2;
uint64_t slot : 4;
uint64_t enable : 1;
uint64_t cu : 4;
uint64_t time : 41;
};
uint64_t raw;
};
std::map<pcinfo_t, int> kernel_ids{{pcinfo_t{0, 0}, 0}};
std::atomic<int> current_id{1};
int
get_kernel_id(pcinfo_t pc)
{
if(kernel_ids.find(pc) != kernel_ids.end()) return kernel_ids.at(pc);
return kernel_ids.emplace(pc, current_id.fetch_add(1)).first->second;
}
uint64_t
convert(const att_occupancy_info_v2_t& v2)
{
occupancy_data_v1 v1{};
v1.time = v2.time / OCCUPANCY_RES;
v1.simd = v2.simd;
v1.slot = v2.slot;
v1.enable = v2.start;
v1.cu = v2.cu;
v1.kernel_id = get_kernel_id(v2.pc);
return v1.raw;
}
} // namespace
namespace OccupancyFile
{
void
OccupancyFile(const Fspath& dir,
std::shared_ptr<AddressTable>& table,
const std::map<size_t, std::vector<att_occupancy_info_v2_t>>& occ)
{
if(!GlobalDefs::get().has_format("json")) return;
nlohmann::json jocc;
for(const auto& [se, eventlist] : occ)
{
nlohmann::json list;
for(const auto& event : eventlist)
list.push_back(convert(event));
jocc[std::to_string(se)] = list;
}
for(auto& [pc, id] : kernel_ids)
{
std::stringstream ss;
try
{
ss << table->getSymbolMap(pc.marker_id).at(pc.addr).name;
} catch(std::exception& e)
{
ss << pc.marker_id << " / 0x" << std::hex << pc.addr << std::dec;
}
jocc["dispatches"][std::to_string(id)] = ss.str();
}
OutputFile(dir / "occupancy.json") << jocc;
}
} // namespace OccupancyFile
} // namespace att_wrapper
} // namespace rocprofiler