97b7a6315d
* Update LICENSE * Update conf.py * Update copyright year * [fix] Update copyright year * Update copyright year "ROCm Developer Tools" * Add license headers to c++ files * Add license to *.py * Update licenses in rocdecode sources --------- Co-authored-by: srawat <120587655+SwRaw@users.noreply.github.com> Co-authored-by: Mythreya <mythreya.kuricheti@amd.com> Co-authored-by: Jonathan R. Madsen <jonathanrmadsen@gmail.com>
110 строки
3.2 KiB
C++
110 строки
3.2 KiB
C++
// MIT License
|
|
//
|
|
// Copyright (c) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all
|
|
// copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
// SOFTWARE.
|
|
|
|
#include "occupancy.hpp"
|
|
#include <nlohmann/json.hpp>
|
|
#include "outputfile.hpp"
|
|
|
|
#include <atomic>
|
|
#include <fstream>
|
|
#include <iostream>
|
|
#include <sstream>
|
|
|
|
// Divisor applied to the v2 event timestamp before it is stored in the
// narrower `time` bit-field of occupancy_data_v1 (see convert()).
// A typed constant replaces the former object-like macro so the name obeys
// normal scoping rules and shows up in the debugger.
constexpr int OCCUPANCY_RES = 8;
|
|
|
|
namespace rocprofiler
|
|
{
|
|
namespace att_wrapper
|
|
{
|
|
/// Packed 64-bit occupancy record ("v1" layout) emitted into occupancy.json.
///
/// The anonymous struct exposes the individual bit-fields; `raw` gives access
/// to the same storage as a single integer, which is what convert() returns.
/// The six field widths add up to exactly 64 bits (12 + 2 + 4 + 1 + 4 + 41).
///
/// NOTE(review): the order in which bit-fields are allocated inside the word
/// is implementation-defined, and reading `raw` after writing the fields
/// relies on union type punning as supported by GCC/Clang -- confirm this is
/// acceptable for every toolchain that builds this file.
union occupancy_data_v1
{
    struct
    {
        uint64_t kernel_id : 12;  ///< ID handed out by get_kernel_id() for the event's pc
        uint64_t simd      : 2;   ///< copied from att_occupancy_info_v2_t::simd
        uint64_t slot      : 4;   ///< copied from att_occupancy_info_v2_t::slot
        uint64_t enable    : 1;   ///< copied from att_occupancy_info_v2_t::start
        uint64_t cu        : 4;   ///< copied from att_occupancy_info_v2_t::cu
        uint64_t time      : 41;  ///< v2 timestamp divided by OCCUPANCY_RES
    };
    uint64_t raw;
};

// The record is serialized through `raw`, so the bit-fields must not spill
// past a single 64-bit word.
static_assert(sizeof(occupancy_data_v1) == sizeof(uint64_t),
              "occupancy_data_v1 bit-fields must fit exactly in one 64-bit word");
|
|
|
|
// Table of every pc seen so far and the integer ID assigned to it.
// It is pre-seeded so that the pc {0, 0} always maps to ID 0.
std::map<pcinfo_t, int> kernel_ids = {{pcinfo_t{0, 0}, 0}};

// Next ID to hand out from get_kernel_id(); starts at 1 because ID 0 is
// already taken by the pre-seeded entry above.
std::atomic<int> current_id{1};
|
|
|
|
static int
|
|
get_kernel_id(pcinfo_t pc)
|
|
{
|
|
if(kernel_ids.find(pc) != kernel_ids.end()) return kernel_ids.at(pc);
|
|
|
|
return kernel_ids.emplace(pc, current_id.fetch_add(1)).first->second;
|
|
}
|
|
|
|
static uint64_t
|
|
convert(const att_occupancy_info_v2_t& v2)
|
|
{
|
|
occupancy_data_v1 v1{};
|
|
v1.time = v2.time / OCCUPANCY_RES;
|
|
v1.simd = v2.simd;
|
|
v1.slot = v2.slot;
|
|
v1.enable = v2.start;
|
|
v1.cu = v2.cu;
|
|
v1.kernel_id = get_kernel_id(v2.pc);
|
|
return v1.raw;
|
|
};
|
|
|
|
void
|
|
OccupancyFile::OccupancyFile(const Fspath& dir,
|
|
std::shared_ptr<AddressTable> table,
|
|
const std::map<size_t, std::vector<att_occupancy_info_v2_t>>& occ)
|
|
{
|
|
if(!GlobalDefs::get().has_format("json")) return;
|
|
nlohmann::json jocc;
|
|
|
|
for(auto& [se, eventlist] : occ)
|
|
{
|
|
nlohmann::json list;
|
|
for(auto& event : eventlist)
|
|
list.push_back(convert(event));
|
|
jocc[std::to_string(se)] = list;
|
|
}
|
|
|
|
for(auto& [pc, id] : kernel_ids)
|
|
{
|
|
std::stringstream ss;
|
|
try
|
|
{
|
|
ss << table->getSymbolMap(pc.marker_id).at(pc.addr).name;
|
|
} catch(std::exception& e)
|
|
{
|
|
ss << pc.marker_id << " / 0x" << std::hex << pc.addr << std::dec;
|
|
}
|
|
jocc["dispatches"][std::to_string(id)] = ss.str();
|
|
}
|
|
|
|
OutputFile(dir / "occupancy.json") << jocc;
|
|
}
|
|
|
|
} // namespace att_wrapper
|
|
} // namespace rocprofiler
|