diff --git a/projects/clr/rocclr/runtime/device/gpu/gpuschedcl.cpp b/projects/clr/rocclr/runtime/device/gpu/gpuschedcl.cpp index c08a88e02c..85ba4fb9a7 100644 --- a/projects/clr/rocclr/runtime/device/gpu/gpuschedcl.cpp +++ b/projects/clr/rocclr/runtime/device/gpu/gpuschedcl.cpp @@ -417,7 +417,7 @@ scheduler( uint tmp = 0; if (atomic_compare_exchange_strong_explicit( (__global atomic_uint*)&param->launch, &tmp, launch, - memory_order_acq_rel, memory_order_acq_rel, memory_scope_device)) { + memory_order_acq_rel, memory_order_acquire, memory_scope_device)) { if (event != 0) { event->timer[PROFILING_COMMAND_START] = (__hsail_get_clock() * (ulong)param->eng_clk) >> 10;