7d2bc9d113
[git-p4: depot-paths = "//depot/stg/hsa/drivers/hsa/runtime/": change = 1250152]
276 regels
10 KiB
C++
276 regels
10 KiB
C++
////////////////////////////////////////////////////////////////////////////////
|
|
//
|
|
// The University of Illinois/NCSA
|
|
// Open Source License (NCSA)
|
|
//
|
|
// Copyright (c) 2014-2015, Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Developed by:
|
|
//
|
|
// AMD Research and AMD HSA Software Development
|
|
//
|
|
// Advanced Micro Devices, Inc.
|
|
//
|
|
// www.amd.com
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files (the "Software"), to
|
|
// deal with the Software without restriction, including without limitation
|
|
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
// and/or sell copies of the Software, and to permit persons to whom the
|
|
// Software is furnished to do so, subject to the following conditions:
|
|
//
|
|
// - Redistributions of source code must retain the above copyright notice,
|
|
// this list of conditions and the following disclaimers.
|
|
// - Redistributions in binary form must reproduce the above copyright
|
|
// notice, this list of conditions and the following disclaimers in
|
|
// the documentation and/or other materials provided with the distribution.
|
|
// - Neither the names of Advanced Micro Devices, Inc,
|
|
// nor the names of its contributors may be used to endorse or promote
|
|
// products derived from this Software without specific prior written
|
|
// permission.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
// DEALINGS WITH THE SOFTWARE.
|
|
//
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#include "core/inc/default_signal.h"
|
|
#include "core/util/timer.h"
|
|
|
|
namespace core {
|
|
|
|
int DefaultSignal::rtti_id_ = 0;
|
|
|
|
DefaultSignal::DefaultSignal(hsa_signal_value_t initial_value)
|
|
: Signal(initial_value) {
|
|
signal_.kind = AMD_SIGNAL_KIND_USER;
|
|
signal_.event_mailbox_ptr = NULL;
|
|
HSA::hsa_memory_register(this, sizeof(DefaultSignal));
|
|
}
|
|
|
|
DefaultSignal::~DefaultSignal() {
|
|
invalid_ = true;
|
|
while (InUse())
|
|
;
|
|
HSA::hsa_memory_deregister(this, sizeof(DefaultSignal));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::LoadRelaxed() {
|
|
return hsa_signal_value_t(
|
|
atomic::Load(&signal_.value, std::memory_order_relaxed));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::LoadAcquire() {
|
|
return hsa_signal_value_t(
|
|
atomic::Load(&signal_.value, std::memory_order_acquire));
|
|
}
|
|
|
|
void DefaultSignal::StoreRelaxed(hsa_signal_value_t value) {
|
|
atomic::Store(&signal_.value, int64_t(value), std::memory_order_relaxed);
|
|
}
|
|
|
|
void DefaultSignal::StoreRelease(hsa_signal_value_t value) {
|
|
atomic::Store(&signal_.value, int64_t(value), std::memory_order_release);
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::WaitRelaxed(hsa_signal_condition_t condition,
|
|
hsa_signal_value_t compare_value,
|
|
uint64_t timeout,
|
|
hsa_wait_state_t wait_hint) {
|
|
atomic::Increment(&waiting_);
|
|
MAKE_SCOPE_GUARD([&]() { atomic::Decrement(&waiting_); });
|
|
bool condition_met = false;
|
|
int64_t value;
|
|
|
|
assert(!g_use_interrupt_wait && "Use of non-host signal in host signal wait API.");
|
|
|
|
timer::fast_clock::time_point start_time, time;
|
|
start_time = timer::fast_clock::now();
|
|
|
|
uint64_t hsa_freq;
|
|
HSA::hsa_system_get_info(HSA_SYSTEM_INFO_TIMESTAMP_FREQUENCY, &hsa_freq);
|
|
const timer::fast_clock::duration fast_timeout =
|
|
timer::duration_from_seconds<timer::fast_clock::duration>(
|
|
double(timeout) / double(hsa_freq));
|
|
|
|
while (true) {
|
|
if (invalid_) return 0;
|
|
|
|
value = atomic::Load(&signal_.value, std::memory_order_relaxed);
|
|
|
|
switch (condition) {
|
|
case HSA_SIGNAL_CONDITION_EQ: {
|
|
condition_met = (value == compare_value);
|
|
break;
|
|
}
|
|
case HSA_SIGNAL_CONDITION_NE: {
|
|
condition_met = (value != compare_value);
|
|
break;
|
|
}
|
|
case HSA_SIGNAL_CONDITION_GTE: {
|
|
condition_met = (value >= compare_value);
|
|
break;
|
|
}
|
|
case HSA_SIGNAL_CONDITION_LT: {
|
|
condition_met = (value < compare_value);
|
|
break;
|
|
}
|
|
default:
|
|
return 0;
|
|
}
|
|
if (condition_met) return hsa_signal_value_t(value);
|
|
|
|
time = timer::fast_clock::now();
|
|
if (time - start_time > fast_timeout) {
|
|
value = atomic::Load(&signal_.value, std::memory_order_relaxed);
|
|
return hsa_signal_value_t(value);
|
|
}
|
|
}
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::WaitAcquire(hsa_signal_condition_t condition,
|
|
hsa_signal_value_t compare_value,
|
|
uint64_t timeout,
|
|
hsa_wait_state_t wait_hint) {
|
|
hsa_signal_value_t ret =
|
|
WaitRelaxed(condition, compare_value, timeout, wait_hint);
|
|
std::atomic_thread_fence(std::memory_order_acquire);
|
|
return ret;
|
|
}
|
|
|
|
void DefaultSignal::AndRelaxed(hsa_signal_value_t value) {
|
|
atomic::And(&signal_.value, int64_t(value), std::memory_order_relaxed);
|
|
}
|
|
|
|
void DefaultSignal::AndAcquire(hsa_signal_value_t value) {
|
|
atomic::And(&signal_.value, int64_t(value), std::memory_order_acquire);
|
|
}
|
|
|
|
void DefaultSignal::AndRelease(hsa_signal_value_t value) {
|
|
atomic::And(&signal_.value, int64_t(value), std::memory_order_release);
|
|
}
|
|
|
|
void DefaultSignal::AndAcqRel(hsa_signal_value_t value) {
|
|
atomic::And(&signal_.value, int64_t(value), std::memory_order_acq_rel);
|
|
}
|
|
|
|
void DefaultSignal::OrRelaxed(hsa_signal_value_t value) {
|
|
atomic::Or(&signal_.value, int64_t(value), std::memory_order_relaxed);
|
|
}
|
|
|
|
void DefaultSignal::OrAcquire(hsa_signal_value_t value) {
|
|
atomic::Or(&signal_.value, int64_t(value), std::memory_order_acquire);
|
|
}
|
|
|
|
void DefaultSignal::OrRelease(hsa_signal_value_t value) {
|
|
atomic::Or(&signal_.value, int64_t(value), std::memory_order_release);
|
|
}
|
|
|
|
void DefaultSignal::OrAcqRel(hsa_signal_value_t value) {
|
|
atomic::Or(&signal_.value, int64_t(value), std::memory_order_acq_rel);
|
|
}
|
|
|
|
void DefaultSignal::XorRelaxed(hsa_signal_value_t value) {
|
|
atomic::Xor(&signal_.value, int64_t(value), std::memory_order_relaxed);
|
|
}
|
|
|
|
void DefaultSignal::XorAcquire(hsa_signal_value_t value) {
|
|
atomic::Xor(&signal_.value, int64_t(value), std::memory_order_acquire);
|
|
}
|
|
|
|
void DefaultSignal::XorRelease(hsa_signal_value_t value) {
|
|
atomic::Xor(&signal_.value, int64_t(value), std::memory_order_release);
|
|
}
|
|
|
|
void DefaultSignal::XorAcqRel(hsa_signal_value_t value) {
|
|
atomic::Xor(&signal_.value, int64_t(value), std::memory_order_acq_rel);
|
|
}
|
|
|
|
void DefaultSignal::AddRelaxed(hsa_signal_value_t value) {
|
|
atomic::Add(&signal_.value, int64_t(value), std::memory_order_relaxed);
|
|
}
|
|
|
|
void DefaultSignal::AddAcquire(hsa_signal_value_t value) {
|
|
atomic::Add(&signal_.value, int64_t(value), std::memory_order_acquire);
|
|
}
|
|
|
|
void DefaultSignal::AddRelease(hsa_signal_value_t value) {
|
|
atomic::Add(&signal_.value, int64_t(value), std::memory_order_release);
|
|
}
|
|
|
|
void DefaultSignal::AddAcqRel(hsa_signal_value_t value) {
|
|
atomic::Add(&signal_.value, int64_t(value), std::memory_order_acq_rel);
|
|
}
|
|
|
|
void DefaultSignal::SubRelaxed(hsa_signal_value_t value) {
|
|
atomic::Sub(&signal_.value, int64_t(value), std::memory_order_relaxed);
|
|
}
|
|
|
|
void DefaultSignal::SubAcquire(hsa_signal_value_t value) {
|
|
atomic::Sub(&signal_.value, int64_t(value), std::memory_order_acquire);
|
|
}
|
|
|
|
void DefaultSignal::SubRelease(hsa_signal_value_t value) {
|
|
atomic::Sub(&signal_.value, int64_t(value), std::memory_order_release);
|
|
}
|
|
|
|
void DefaultSignal::SubAcqRel(hsa_signal_value_t value) {
|
|
atomic::Sub(&signal_.value, int64_t(value), std::memory_order_acq_rel);
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::ExchRelaxed(hsa_signal_value_t value) {
|
|
return hsa_signal_value_t(atomic::Exchange(&signal_.value, int64_t(value),
|
|
std::memory_order_relaxed));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::ExchAcquire(hsa_signal_value_t value) {
|
|
return hsa_signal_value_t(atomic::Exchange(&signal_.value, int64_t(value),
|
|
std::memory_order_acquire));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::ExchRelease(hsa_signal_value_t value) {
|
|
return hsa_signal_value_t(atomic::Exchange(&signal_.value, int64_t(value),
|
|
std::memory_order_release));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::ExchAcqRel(hsa_signal_value_t value) {
|
|
return hsa_signal_value_t(atomic::Exchange(&signal_.value, int64_t(value),
|
|
std::memory_order_acq_rel));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::CasRelaxed(hsa_signal_value_t expected,
|
|
hsa_signal_value_t value) {
|
|
return hsa_signal_value_t(atomic::Cas(&signal_.value, int64_t(value),
|
|
int64_t(expected),
|
|
std::memory_order_relaxed));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::CasAcquire(hsa_signal_value_t expected,
|
|
hsa_signal_value_t value) {
|
|
return hsa_signal_value_t(atomic::Cas(&signal_.value, int64_t(value),
|
|
int64_t(expected),
|
|
std::memory_order_acquire));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::CasRelease(hsa_signal_value_t expected,
|
|
hsa_signal_value_t value) {
|
|
return hsa_signal_value_t(atomic::Cas(&signal_.value, int64_t(value),
|
|
int64_t(expected),
|
|
std::memory_order_release));
|
|
}
|
|
|
|
hsa_signal_value_t DefaultSignal::CasAcqRel(hsa_signal_value_t expected,
|
|
hsa_signal_value_t value) {
|
|
return hsa_signal_value_t(atomic::Cas(&signal_.value, int64_t(value),
|
|
int64_t(expected),
|
|
std::memory_order_acq_rel));
|
|
}
|
|
|
|
} // namespace core
|