From dfcb8cb2a92c9f72ddde5ea08dadf2f640197d32 Mon Sep 17 00:00:00 2001 From: Joseph Huber Date: Mon, 5 May 2025 16:33:41 -0500 Subject: [PATCH] [OpenMP] Add pre sm_70 load hack back in (#138589) Summary: Different ordering modes aren't supported for an atomic load, so we just do an add of zero as the same thing. It's less efficient, but it works. Fixes https://github.com/llvm/llvm-project/issues/138560 --- offload/DeviceRTL/include/Synchronization.h | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/offload/DeviceRTL/include/Synchronization.h b/offload/DeviceRTL/include/Synchronization.h index f9eb8d0d2319..7e7c8eacb917 100644 --- a/offload/DeviceRTL/include/Synchronization.h +++ b/offload/DeviceRTL/include/Synchronization.h @@ -59,7 +59,11 @@ V add(Ty *Address, V Val, atomic::OrderingTy Ordering, template > V load(Ty *Address, atomic::OrderingTy Ordering, MemScopeTy MemScope = MemScopeTy::device) { +#ifdef __NVPTX__ + return __scoped_atomic_fetch_add(Address, V(0), Ordering, MemScope); +#else return __scoped_atomic_load_n(Address, Ordering, MemScope); +#endif } template >