1349cc55cSDimitry Andric //===----------------------------------------------------------------------===//
25ffd83dbSDimitry Andric //
35ffd83dbSDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
45ffd83dbSDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
55ffd83dbSDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
65ffd83dbSDimitry Andric //
75ffd83dbSDimitry Andric //===----------------------------------------------------------------------===//
85ffd83dbSDimitry Andric 
906c3fb27SDimitry Andric #include <__thread/timed_backoff_policy.h>
105ffd83dbSDimitry Andric #include <atomic>
1104eeddc0SDimitry Andric #include <climits>
125ffd83dbSDimitry Andric #include <functional>
1304eeddc0SDimitry Andric #include <thread>
145ffd83dbSDimitry Andric 
1506c3fb27SDimitry Andric #include "include/apple_availability.h"
1606c3fb27SDimitry Andric 
175ffd83dbSDimitry Andric #ifdef __linux__
185ffd83dbSDimitry Andric 
195ffd83dbSDimitry Andric #  include <linux/futex.h>
205ffd83dbSDimitry Andric #  include <sys/syscall.h>
21cb14a3feSDimitry Andric #  include <unistd.h>
225ffd83dbSDimitry Andric 
23d409305fSDimitry Andric // libc++ uses SYS_futex as a universal syscall name. However, on 32 bit architectures
24d409305fSDimitry Andric // with a 64 bit time_t, we need to specify SYS_futex_time64.
25d409305fSDimitry Andric #  if !defined(SYS_futex) && defined(SYS_futex_time64)
26d409305fSDimitry Andric #    define SYS_futex SYS_futex_time64
27d409305fSDimitry Andric #  endif
28*3a079333SDimitry Andric #  define _LIBCPP_FUTEX(...) syscall(SYS_futex, __VA_ARGS__)
29d409305fSDimitry Andric 
309c996882SKonstantin Belousov #elif defined(__FreeBSD__)
319c996882SKonstantin Belousov 
329c996882SKonstantin Belousov #  include <sys/types.h>
339c996882SKonstantin Belousov #  include <sys/umtx.h>
349c996882SKonstantin Belousov 
35*3a079333SDimitry Andric #  define _LIBCPP_FUTEX(...) syscall(SYS_futex, __VA_ARGS__)
36*3a079333SDimitry Andric 
37*3a079333SDimitry Andric #elif defined(__OpenBSD__)
38*3a079333SDimitry Andric 
39*3a079333SDimitry Andric #  include <sys/futex.h>
40*3a079333SDimitry Andric 
41*3a079333SDimitry Andric // OpenBSD has no indirect syscalls
42*3a079333SDimitry Andric #  define _LIBCPP_FUTEX(...) futex(__VA_ARGS__)
43*3a079333SDimitry Andric 
445ffd83dbSDimitry Andric #else // <- Add other operating systems here
455ffd83dbSDimitry Andric 
465ffd83dbSDimitry Andric // Baseline needs no new headers
475ffd83dbSDimitry Andric 
48*3a079333SDimitry Andric #  define _LIBCPP_FUTEX(...) syscall(SYS_futex, __VA_ARGS__)
49*3a079333SDimitry Andric 
505ffd83dbSDimitry Andric #endif
515ffd83dbSDimitry Andric 
525ffd83dbSDimitry Andric _LIBCPP_BEGIN_NAMESPACE_STD
535ffd83dbSDimitry Andric 
545ffd83dbSDimitry Andric #ifdef __linux__
555ffd83dbSDimitry Andric 
56cb14a3feSDimitry Andric static void
__libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile * __ptr,__cxx_contention_t __val)57cb14a3feSDimitry Andric __libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile* __ptr, __cxx_contention_t __val) {
585ffd83dbSDimitry Andric   static constexpr timespec __timeout = {2, 0};
59*3a079333SDimitry Andric   _LIBCPP_FUTEX(__ptr, FUTEX_WAIT_PRIVATE, __val, &__timeout, 0, 0);
605ffd83dbSDimitry Andric }
615ffd83dbSDimitry Andric 
__libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile * __ptr,bool __notify_one)62cb14a3feSDimitry Andric static void __libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile* __ptr, bool __notify_one) {
63*3a079333SDimitry Andric   _LIBCPP_FUTEX(__ptr, FUTEX_WAKE_PRIVATE, __notify_one ? 1 : INT_MAX, 0, 0, 0);
645ffd83dbSDimitry Andric }
655ffd83dbSDimitry Andric 
665ffd83dbSDimitry Andric #elif defined(__APPLE__) && defined(_LIBCPP_USE_ULOCK)
675ffd83dbSDimitry Andric 
// Declarations of the ulock wait/wake entry points used by the Apple code path below.
extern "C" int __ulock_wait(uint32_t operation,
                            void* addr,
                            uint64_t value,
                            uint32_t timeout /* timeout is specified in microseconds */);
extern "C" int __ulock_wake(uint32_t operation, void* addr, uint64_t wake_value);

// Operation code and flag passed in the 'operation' argument of the calls above.
#  define UL_COMPARE_AND_WAIT 1
#  define ULF_WAKE_ALL 0x00000100
745ffd83dbSDimitry Andric 
75cb14a3feSDimitry Andric static void
76cb14a3feSDimitry Andric __libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile* __ptr, __cxx_contention_t __val) {
77cb14a3feSDimitry Andric   __ulock_wait(UL_COMPARE_AND_WAIT, const_cast<__cxx_atomic_contention_t*>(__ptr), __val, 0);
785ffd83dbSDimitry Andric }
795ffd83dbSDimitry Andric 
80cb14a3feSDimitry Andric static void __libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile* __ptr, bool __notify_one) {
81cb14a3feSDimitry Andric   __ulock_wake(
82cb14a3feSDimitry Andric       UL_COMPARE_AND_WAIT | (__notify_one ? 0 : ULF_WAKE_ALL), const_cast<__cxx_atomic_contention_t*>(__ptr), 0);
835ffd83dbSDimitry Andric }
845ffd83dbSDimitry Andric 
8525b18d89SKonstantin Belousov #elif defined(__FreeBSD__) && __SIZEOF_LONG__ == 8
864c4a2926SKonstantin Belousov /*
874c4a2926SKonstantin Belousov  * Since __cxx_contention_t is int64_t even on 32bit FreeBSD
884c4a2926SKonstantin Belousov  * platforms, we have to use umtx ops that work on the long type, and
894c4a2926SKonstantin Belousov  * limit its use to architectures where long and int64_t are synonyms.
904c4a2926SKonstantin Belousov  */
919c996882SKonstantin Belousov 
92cb14a3feSDimitry Andric static void
93cb14a3feSDimitry Andric __libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile* __ptr, __cxx_contention_t __val) {
94cb14a3feSDimitry Andric   _umtx_op(const_cast<__cxx_atomic_contention_t*>(__ptr), UMTX_OP_WAIT, __val, NULL, NULL);
959c996882SKonstantin Belousov }
969c996882SKonstantin Belousov 
97cb14a3feSDimitry Andric static void __libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile* __ptr, bool __notify_one) {
98cb14a3feSDimitry Andric   _umtx_op(const_cast<__cxx_atomic_contention_t*>(__ptr), UMTX_OP_WAKE, __notify_one ? 1 : INT_MAX, NULL, NULL);
999c996882SKonstantin Belousov }
1009c996882SKonstantin Belousov 
1015ffd83dbSDimitry Andric #else // <- Add other operating systems here
1025ffd83dbSDimitry Andric 
1035ffd83dbSDimitry Andric // Baseline is just a timed backoff
1045ffd83dbSDimitry Andric 
105cb14a3feSDimitry Andric static void
106cb14a3feSDimitry Andric __libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile* __ptr, __cxx_contention_t __val) {
107cb14a3feSDimitry Andric   __libcpp_thread_poll_with_backoff(
108cb14a3feSDimitry Andric       [=]() -> bool { return !__cxx_nonatomic_compare_equal(__cxx_atomic_load(__ptr, memory_order_relaxed), __val); },
109cb14a3feSDimitry Andric       __libcpp_timed_backoff_policy());
1105ffd83dbSDimitry Andric }
1115ffd83dbSDimitry Andric 
1125ffd83dbSDimitry Andric static void __libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile*, bool) {}
1135ffd83dbSDimitry Andric 
1145ffd83dbSDimitry Andric #endif // __linux__
1155ffd83dbSDimitry Andric 
// Number of slots in the contention table. The value itself is arbitrary, but the slot
// lookup masks the hash with (size - 1), so it has to stay a power of two.
static constexpr size_t __libcpp_contention_table_size = size_t(1) << 8;
1175ffd83dbSDimitry Andric 
118cb14a3feSDimitry Andric struct alignas(64) /*  aim to avoid false sharing */ __libcpp_contention_table_entry {
1195ffd83dbSDimitry Andric   __cxx_atomic_contention_t __contention_state;
1205ffd83dbSDimitry Andric   __cxx_atomic_contention_t __platform_state;
__libcpp_contention_table_entry__libcpp_contention_table_entry121cb14a3feSDimitry Andric   inline constexpr __libcpp_contention_table_entry() : __contention_state(0), __platform_state(0) {}
1225ffd83dbSDimitry Andric };
1235ffd83dbSDimitry Andric 
1245ffd83dbSDimitry Andric static __libcpp_contention_table_entry __libcpp_contention_table[__libcpp_contention_table_size];
1255ffd83dbSDimitry Andric 
1265ffd83dbSDimitry Andric static hash<void const volatile*> __libcpp_contention_hasher;
1275ffd83dbSDimitry Andric 
__libcpp_contention_state(void const volatile * p)128cb14a3feSDimitry Andric static __libcpp_contention_table_entry* __libcpp_contention_state(void const volatile* p) {
1295ffd83dbSDimitry Andric   return &__libcpp_contention_table[__libcpp_contention_hasher(p) & (__libcpp_contention_table_size - 1)];
1305ffd83dbSDimitry Andric }
1315ffd83dbSDimitry Andric 
1325ffd83dbSDimitry Andric /* Given an atomic to track contention and an atomic to actually wait on, which may be
1335ffd83dbSDimitry Andric    the same atomic, we try to detect contention to avoid spuriously calling the platform. */
1345ffd83dbSDimitry Andric 
__libcpp_contention_notify(__cxx_atomic_contention_t volatile * __contention_state,__cxx_atomic_contention_t const volatile * __platform_state,bool __notify_one)1355ffd83dbSDimitry Andric static void __libcpp_contention_notify(__cxx_atomic_contention_t volatile* __contention_state,
1365ffd83dbSDimitry Andric                                        __cxx_atomic_contention_t const volatile* __platform_state,
137cb14a3feSDimitry Andric                                        bool __notify_one) {
1385ffd83dbSDimitry Andric   if (0 != __cxx_atomic_load(__contention_state, memory_order_seq_cst))
1395ffd83dbSDimitry Andric     // We only call 'wake' if we consumed a contention bit here.
1405ffd83dbSDimitry Andric     __libcpp_platform_wake_by_address(__platform_state, __notify_one);
1415ffd83dbSDimitry Andric }
142cb14a3feSDimitry Andric static __cxx_contention_t
__libcpp_contention_monitor_for_wait(__cxx_atomic_contention_t volatile *,__cxx_atomic_contention_t const volatile * __platform_state)143cb14a3feSDimitry Andric __libcpp_contention_monitor_for_wait(__cxx_atomic_contention_t volatile* /*__contention_state*/,
144cb14a3feSDimitry Andric                                      __cxx_atomic_contention_t const volatile* __platform_state) {
1455ffd83dbSDimitry Andric   // We will monitor this value.
1465ffd83dbSDimitry Andric   return __cxx_atomic_load(__platform_state, memory_order_acquire);
1475ffd83dbSDimitry Andric }
__libcpp_contention_wait(__cxx_atomic_contention_t volatile * __contention_state,__cxx_atomic_contention_t const volatile * __platform_state,__cxx_contention_t __old_value)1485ffd83dbSDimitry Andric static void __libcpp_contention_wait(__cxx_atomic_contention_t volatile* __contention_state,
1495ffd83dbSDimitry Andric                                      __cxx_atomic_contention_t const volatile* __platform_state,
150cb14a3feSDimitry Andric                                      __cxx_contention_t __old_value) {
1515ffd83dbSDimitry Andric   __cxx_atomic_fetch_add(__contention_state, __cxx_contention_t(1), memory_order_seq_cst);
1525ffd83dbSDimitry Andric   // We sleep as long as the monitored value hasn't changed.
1535ffd83dbSDimitry Andric   __libcpp_platform_wait_on_address(__platform_state, __old_value);
1545ffd83dbSDimitry Andric   __cxx_atomic_fetch_sub(__contention_state, __cxx_contention_t(1), memory_order_release);
1555ffd83dbSDimitry Andric }
1565ffd83dbSDimitry Andric 
/* When the incoming atomic is the wrong size for the platform wait size, we need to
   launder the value sequence through an atomic from our table. */
1595ffd83dbSDimitry Andric 
__libcpp_atomic_notify(void const volatile * __location)160cb14a3feSDimitry Andric static void __libcpp_atomic_notify(void const volatile* __location) {
1615ffd83dbSDimitry Andric   auto const __entry = __libcpp_contention_state(__location);
1625ffd83dbSDimitry Andric   // The value sequence laundering happens on the next line below.
1635ffd83dbSDimitry Andric   __cxx_atomic_fetch_add(&__entry->__platform_state, __cxx_contention_t(1), memory_order_release);
164cb14a3feSDimitry Andric   __libcpp_contention_notify(
165cb14a3feSDimitry Andric       &__entry->__contention_state,
1665ffd83dbSDimitry Andric       &__entry->__platform_state,
1675ffd83dbSDimitry Andric       false /* when laundering, we can't handle notify_one */);
1685ffd83dbSDimitry Andric }
__cxx_atomic_notify_one(void const volatile * __location)169cb14a3feSDimitry Andric _LIBCPP_EXPORTED_FROM_ABI void __cxx_atomic_notify_one(void const volatile* __location) {
170cb14a3feSDimitry Andric   __libcpp_atomic_notify(__location);
171cb14a3feSDimitry Andric }
__cxx_atomic_notify_all(void const volatile * __location)172cb14a3feSDimitry Andric _LIBCPP_EXPORTED_FROM_ABI void __cxx_atomic_notify_all(void const volatile* __location) {
173cb14a3feSDimitry Andric   __libcpp_atomic_notify(__location);
174cb14a3feSDimitry Andric }
__libcpp_atomic_monitor(void const volatile * __location)175cb14a3feSDimitry Andric _LIBCPP_EXPORTED_FROM_ABI __cxx_contention_t __libcpp_atomic_monitor(void const volatile* __location) {
1765ffd83dbSDimitry Andric   auto const __entry = __libcpp_contention_state(__location);
1775ffd83dbSDimitry Andric   return __libcpp_contention_monitor_for_wait(&__entry->__contention_state, &__entry->__platform_state);
1785ffd83dbSDimitry Andric }
__libcpp_atomic_wait(void const volatile * __location,__cxx_contention_t __old_value)179cb14a3feSDimitry Andric _LIBCPP_EXPORTED_FROM_ABI void __libcpp_atomic_wait(void const volatile* __location, __cxx_contention_t __old_value) {
1805ffd83dbSDimitry Andric   auto const __entry = __libcpp_contention_state(__location);
1815ffd83dbSDimitry Andric   __libcpp_contention_wait(&__entry->__contention_state, &__entry->__platform_state, __old_value);
1825ffd83dbSDimitry Andric }
1835ffd83dbSDimitry Andric 
1845ffd83dbSDimitry Andric /* When the incoming atomic happens to be the platform wait size, we still need to use the
1855ffd83dbSDimitry Andric    table for the contention detection, but we can use the atomic directly for the wait. */
1865ffd83dbSDimitry Andric 
__cxx_atomic_notify_one(__cxx_atomic_contention_t const volatile * __location)187cb14a3feSDimitry Andric _LIBCPP_EXPORTED_FROM_ABI void __cxx_atomic_notify_one(__cxx_atomic_contention_t const volatile* __location) {
1885ffd83dbSDimitry Andric   __libcpp_contention_notify(&__libcpp_contention_state(__location)->__contention_state, __location, true);
1895ffd83dbSDimitry Andric }
__cxx_atomic_notify_all(__cxx_atomic_contention_t const volatile * __location)190cb14a3feSDimitry Andric _LIBCPP_EXPORTED_FROM_ABI void __cxx_atomic_notify_all(__cxx_atomic_contention_t const volatile* __location) {
1915ffd83dbSDimitry Andric   __libcpp_contention_notify(&__libcpp_contention_state(__location)->__contention_state, __location, false);
1925ffd83dbSDimitry Andric }
193cb14a3feSDimitry Andric _LIBCPP_EXPORTED_FROM_ABI __cxx_contention_t
__libcpp_atomic_monitor(__cxx_atomic_contention_t const volatile * __location)194cb14a3feSDimitry Andric __libcpp_atomic_monitor(__cxx_atomic_contention_t const volatile* __location) {
1955ffd83dbSDimitry Andric   return __libcpp_contention_monitor_for_wait(&__libcpp_contention_state(__location)->__contention_state, __location);
1965ffd83dbSDimitry Andric }
197cb14a3feSDimitry Andric _LIBCPP_EXPORTED_FROM_ABI void
__libcpp_atomic_wait(__cxx_atomic_contention_t const volatile * __location,__cxx_contention_t __old_value)198cb14a3feSDimitry Andric __libcpp_atomic_wait(__cxx_atomic_contention_t const volatile* __location, __cxx_contention_t __old_value) {
1995ffd83dbSDimitry Andric   __libcpp_contention_wait(&__libcpp_contention_state(__location)->__contention_state, __location, __old_value);
2005ffd83dbSDimitry Andric }
2015ffd83dbSDimitry Andric 
2025ffd83dbSDimitry Andric _LIBCPP_END_NAMESPACE_STD
203