1 | //===----------------------------------------------------------------------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | |
9 | #include <__thread/timed_backoff_policy.h> |
10 | #include <atomic> |
11 | #include <climits> |
12 | #include <functional> |
13 | #include <thread> |
14 | |
15 | #include "include/apple_availability.h" |
16 | |
17 | #ifdef __linux__ |
18 | |
19 | # include <linux/futex.h> |
20 | # include <sys/syscall.h> |
21 | # include <unistd.h> |
22 | |
23 | // libc++ uses SYS_futex as a universal syscall name. However, on 32 bit architectures |
24 | // with a 64 bit time_t, we need to specify SYS_futex_time64. |
25 | # if !defined(SYS_futex) && defined(SYS_futex_time64) |
26 | # define SYS_futex SYS_futex_time64 |
27 | # endif |
28 | # define _LIBCPP_FUTEX(...) syscall(SYS_futex, __VA_ARGS__) |
29 | |
30 | #elif defined(__FreeBSD__) |
31 | |
32 | # include <sys/types.h> |
33 | # include <sys/umtx.h> |
34 | |
35 | # define _LIBCPP_FUTEX(...) syscall(SYS_futex, __VA_ARGS__) |
36 | |
37 | #elif defined(__OpenBSD__) |
38 | |
39 | # include <sys/futex.h> |
40 | |
41 | // OpenBSD has no indirect syscalls |
42 | # define _LIBCPP_FUTEX(...) futex(__VA_ARGS__) |
43 | |
44 | #else // <- Add other operating systems here |
45 | |
46 | // Baseline needs no new headers |
47 | |
48 | # define _LIBCPP_FUTEX(...) syscall(SYS_futex, __VA_ARGS__) |
49 | |
50 | #endif |
51 | |
52 | _LIBCPP_BEGIN_NAMESPACE_STD |
53 | |
54 | #ifdef __linux__ |
55 | |
56 | static void |
57 | __libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile* __ptr, __cxx_contention_t __val) { |
58 | static constexpr timespec __timeout = {.tv_sec: 2, .tv_nsec: 0}; |
59 | _LIBCPP_FUTEX(__ptr, FUTEX_WAIT_PRIVATE, __val, &__timeout, 0, 0); |
60 | } |
61 | |
62 | static void __libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile* __ptr, bool __notify_one) { |
63 | _LIBCPP_FUTEX(__ptr, FUTEX_WAKE_PRIVATE, __notify_one ? 1 : INT_MAX, 0, 0, 0); |
64 | } |
65 | |
66 | #elif defined(__APPLE__) && defined(_LIBCPP_USE_ULOCK) |
67 | |
68 | extern "C" int __ulock_wait( |
69 | uint32_t operation, void* addr, uint64_t value, uint32_t timeout); /* timeout is specified in microseconds */ |
70 | extern "C" int __ulock_wake(uint32_t operation, void* addr, uint64_t wake_value); |
71 | |
72 | // https://github.com/apple/darwin-xnu/blob/2ff845c2e033bd0ff64b5b6aa6063a1f8f65aa32/bsd/sys/ulock.h#L82 |
73 | # define UL_COMPARE_AND_WAIT64 5 |
74 | # define ULF_WAKE_ALL 0x00000100 |
75 | |
76 | static void |
77 | __libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile* __ptr, __cxx_contention_t __val) { |
78 | static_assert(sizeof(__cxx_atomic_contention_t) == 8, "Waiting on 8 bytes value" ); |
79 | __ulock_wait(UL_COMPARE_AND_WAIT64, const_cast<__cxx_atomic_contention_t*>(__ptr), __val, 0); |
80 | } |
81 | |
82 | static void __libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile* __ptr, bool __notify_one) { |
83 | static_assert(sizeof(__cxx_atomic_contention_t) == 8, "Waking up on 8 bytes value" ); |
84 | __ulock_wake( |
85 | UL_COMPARE_AND_WAIT64 | (__notify_one ? 0 : ULF_WAKE_ALL), const_cast<__cxx_atomic_contention_t*>(__ptr), 0); |
86 | } |
87 | |
88 | #elif defined(__FreeBSD__) && __SIZEOF_LONG__ == 8 |
89 | /* |
90 | * Since __cxx_contention_t is int64_t even on 32bit FreeBSD |
91 | * platforms, we have to use umtx ops that work on the long type, and |
92 | * limit its use to architectures where long and int64_t are synonyms. |
93 | */ |
94 | |
95 | static void |
96 | __libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile* __ptr, __cxx_contention_t __val) { |
97 | _umtx_op(const_cast<__cxx_atomic_contention_t*>(__ptr), UMTX_OP_WAIT, __val, NULL, NULL); |
98 | } |
99 | |
100 | static void __libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile* __ptr, bool __notify_one) { |
101 | _umtx_op(const_cast<__cxx_atomic_contention_t*>(__ptr), UMTX_OP_WAKE, __notify_one ? 1 : INT_MAX, NULL, NULL); |
102 | } |
103 | |
104 | #else // <- Add other operating systems here |
105 | |
106 | // Baseline is just a timed backoff |
107 | |
108 | static void |
109 | __libcpp_platform_wait_on_address(__cxx_atomic_contention_t const volatile* __ptr, __cxx_contention_t __val) { |
110 | __libcpp_thread_poll_with_backoff( |
111 | [=]() -> bool { return !__cxx_nonatomic_compare_equal(__cxx_atomic_load(__ptr, memory_order_relaxed), __val); }, |
112 | __libcpp_timed_backoff_policy()); |
113 | } |
114 | |
115 | static void __libcpp_platform_wake_by_address(__cxx_atomic_contention_t const volatile*, bool) {} |
116 | |
117 | #endif // __linux__ |
118 | |
119 | static constexpr size_t __libcpp_contention_table_size = (1 << 8); /* < there's no magic in this number */ |
120 | |
121 | struct alignas(64) /* aim to avoid false sharing */ __libcpp_contention_table_entry { |
122 | __cxx_atomic_contention_t __contention_state; |
123 | __cxx_atomic_contention_t __platform_state; |
124 | inline constexpr __libcpp_contention_table_entry() : __contention_state(0), __platform_state(0) {} |
125 | }; |
126 | |
127 | static __libcpp_contention_table_entry __libcpp_contention_table[__libcpp_contention_table_size]; |
128 | |
129 | static hash<void const volatile*> __libcpp_contention_hasher; |
130 | |
131 | static __libcpp_contention_table_entry* __libcpp_contention_state(void const volatile* p) { |
132 | return &__libcpp_contention_table[__libcpp_contention_hasher(p) & (__libcpp_contention_table_size - 1)]; |
133 | } |
134 | |
135 | /* Given an atomic to track contention and an atomic to actually wait on, which may be |
136 | the same atomic, we try to detect contention to avoid spuriously calling the platform. */ |
137 | |
138 | static void __libcpp_contention_notify(__cxx_atomic_contention_t volatile* __contention_state, |
139 | __cxx_atomic_contention_t const volatile* __platform_state, |
140 | bool __notify_one) { |
141 | if (0 != __cxx_atomic_load(a: __contention_state, order: memory_order_seq_cst)) |
142 | // We only call 'wake' if we consumed a contention bit here. |
143 | __libcpp_platform_wake_by_address(ptr: __platform_state, __notify_one); |
144 | } |
145 | static __cxx_contention_t |
146 | __libcpp_contention_monitor_for_wait(__cxx_atomic_contention_t volatile* /*__contention_state*/, |
147 | __cxx_atomic_contention_t const volatile* __platform_state) { |
148 | // We will monitor this value. |
149 | return __cxx_atomic_load(a: __platform_state, order: memory_order_acquire); |
150 | } |
151 | static void __libcpp_contention_wait(__cxx_atomic_contention_t volatile* __contention_state, |
152 | __cxx_atomic_contention_t const volatile* __platform_state, |
153 | __cxx_contention_t __old_value) { |
154 | __cxx_atomic_fetch_add(a: __contention_state, delta: __cxx_contention_t(1), order: memory_order_seq_cst); |
155 | // We sleep as long as the monitored value hasn't changed. |
156 | __libcpp_platform_wait_on_address(ptr: __platform_state, val: __old_value); |
157 | __cxx_atomic_fetch_sub(a: __contention_state, delta: __cxx_contention_t(1), order: memory_order_release); |
158 | } |
159 | |
160 | /* When the incoming atomic is the wrong size for the platform wait size, need to |
161 | launder the value sequence through an atomic from our table. */ |
162 | |
163 | static void __libcpp_atomic_notify(void const volatile* __location) { |
164 | auto const __entry = __libcpp_contention_state(p: __location); |
165 | // The value sequence laundering happens on the next line below. |
166 | __cxx_atomic_fetch_add(a: &__entry->__platform_state, delta: __cxx_contention_t(1), order: memory_order_release); |
167 | __libcpp_contention_notify( |
168 | contention_state: &__entry->__contention_state, |
169 | platform_state: &__entry->__platform_state, |
170 | notify_one: false /* when laundering, we can't handle notify_one */); |
171 | } |
172 | _LIBCPP_EXPORTED_FROM_ABI void __cxx_atomic_notify_one(void const volatile* __location) noexcept { |
173 | __libcpp_atomic_notify(__location); |
174 | } |
175 | _LIBCPP_EXPORTED_FROM_ABI void __cxx_atomic_notify_all(void const volatile* __location) noexcept { |
176 | __libcpp_atomic_notify(__location); |
177 | } |
178 | _LIBCPP_EXPORTED_FROM_ABI __cxx_contention_t __libcpp_atomic_monitor(void const volatile* __location) noexcept { |
179 | auto const __entry = __libcpp_contention_state(p: __location); |
180 | return __libcpp_contention_monitor_for_wait(&__entry->__contention_state, platform_state: &__entry->__platform_state); |
181 | } |
182 | _LIBCPP_EXPORTED_FROM_ABI void |
183 | __libcpp_atomic_wait(void const volatile* __location, __cxx_contention_t __old_value) noexcept { |
184 | auto const __entry = __libcpp_contention_state(p: __location); |
185 | __libcpp_contention_wait(contention_state: &__entry->__contention_state, platform_state: &__entry->__platform_state, __old_value); |
186 | } |
187 | |
188 | /* When the incoming atomic happens to be the platform wait size, we still need to use the |
189 | table for the contention detection, but we can use the atomic directly for the wait. */ |
190 | |
191 | _LIBCPP_EXPORTED_FROM_ABI void __cxx_atomic_notify_one(__cxx_atomic_contention_t const volatile* __location) noexcept { |
192 | __libcpp_contention_notify(contention_state: &__libcpp_contention_state(p: __location)->__contention_state, platform_state: __location, notify_one: true); |
193 | } |
194 | _LIBCPP_EXPORTED_FROM_ABI void __cxx_atomic_notify_all(__cxx_atomic_contention_t const volatile* __location) noexcept { |
195 | __libcpp_contention_notify(contention_state: &__libcpp_contention_state(p: __location)->__contention_state, platform_state: __location, notify_one: false); |
196 | } |
197 | // This function is never used, but still exported for ABI compatibility. |
198 | _LIBCPP_EXPORTED_FROM_ABI __cxx_contention_t |
199 | __libcpp_atomic_monitor(__cxx_atomic_contention_t const volatile* __location) noexcept { |
200 | return __libcpp_contention_monitor_for_wait(&__libcpp_contention_state(p: __location)->__contention_state, platform_state: __location); |
201 | } |
202 | _LIBCPP_EXPORTED_FROM_ABI void |
203 | __libcpp_atomic_wait(__cxx_atomic_contention_t const volatile* __location, __cxx_contention_t __old_value) noexcept { |
204 | __libcpp_contention_wait(contention_state: &__libcpp_contention_state(p: __location)->__contention_state, platform_state: __location, __old_value); |
205 | } |
206 | |
207 | _LIBCPP_END_NAMESPACE_STD |
208 | |