| 1 | // -*- C++ -*- header. |
| 2 | |
| 3 | // Copyright (C) 2020-2021 Free Software Foundation, Inc. |
| 4 | // |
| 5 | // This file is part of the GNU ISO C++ Library. This library is free |
| 6 | // software; you can redistribute it and/or modify it under the |
| 7 | // terms of the GNU General Public License as published by the |
| 8 | // Free Software Foundation; either version 3, or (at your option) |
| 9 | // any later version. |
| 10 | |
| 11 | // This library is distributed in the hope that it will be useful, |
| 12 | // but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 13 | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 14 | // GNU General Public License for more details. |
| 15 | |
| 16 | // Under Section 7 of GPL version 3, you are granted additional |
| 17 | // permissions described in the GCC Runtime Library Exception, version |
| 18 | // 3.1, as published by the Free Software Foundation. |
| 19 | |
| 20 | // You should have received a copy of the GNU General Public License and |
| 21 | // a copy of the GCC Runtime Library Exception along with this program; |
| 22 | // see the files COPYING3 and COPYING.RUNTIME respectively. If not, see |
| 23 | // <http://www.gnu.org/licenses/>. |
| 24 | |
| 25 | /** @file bits/atomic_wait.h |
| 26 | * This is an internal header file, included by other library headers. |
| 27 | * Do not attempt to use it directly. @headername{atomic} |
| 28 | */ |
| 29 | |
| 30 | #ifndef _GLIBCXX_ATOMIC_WAIT_H |
| 31 | #define _GLIBCXX_ATOMIC_WAIT_H 1 |
| 32 | |
| 33 | #pragma GCC system_header |
| 34 | |
| 35 | #include <bits/c++config.h> |
| 36 | #if defined _GLIBCXX_HAS_GTHREADS || defined _GLIBCXX_HAVE_LINUX_FUTEX |
| 37 | #include <bits/functional_hash.h> |
| 38 | #include <bits/gthr.h> |
| 39 | #include <ext/numeric_traits.h> |
| 40 | |
| 41 | #ifdef _GLIBCXX_HAVE_LINUX_FUTEX |
| 42 | # include <cerrno> |
| 43 | # include <climits> |
| 44 | # include <unistd.h> |
| 45 | # include <syscall.h> |
| 46 | # include <bits/functexcept.h> |
| 47 | #endif |
| 48 | |
| 49 | # include <bits/std_mutex.h> // std::mutex, std::__condvar |
| 50 | |
| 51 | #define __cpp_lib_atomic_wait 201907L |
| 52 | |
| 53 | namespace std _GLIBCXX_VISIBILITY(default) |
| 54 | { |
| 55 | _GLIBCXX_BEGIN_NAMESPACE_VERSION |
| 56 | namespace __detail |
| 57 | { |
#ifdef _GLIBCXX_HAVE_LINUX_FUTEX
// A futex is available: advertise a native platform wait and use the
// int-sized, 4-byte-aligned word that the futex calls below operate on.
#define _GLIBCXX_HAVE_PLATFORM_WAIT 1
using __platform_wait_t = int;
static constexpr size_t __platform_wait_alignment = 4;
#else
// No native wait primitive is selected here, so waiting falls back to a
// mutex/condvar pair keyed on a 64-bit counter.
//
// Porting note: if the platform supports a more efficient primitive
// (e.g. __ulock_wait()/__ulock_wake()), define _GLIBCXX_HAVE_PLATFORM_WAIT
// and implement __platform_wait() and __platform_notify() in terms of it.
using __platform_wait_t = uint64_t;
static constexpr size_t __platform_wait_alignment
  = __alignof__(__platform_wait_t);
#endif
| 71 | } // namespace __detail |
| 72 | |
// True when an object of type _Tp can be handed directly to the platform
// wait primitive, i.e. it is a scalar with the same size as
// __platform_wait_t and at least the alignment that primitive requires.
// When no platform wait is available this is always false.
//
// The alignment test is made on _Tp itself.  Testing alignof(_Tp*) would
// inspect the alignment of a pointer object, which says nothing about
// how the waited-on object is aligned.
template<typename _Tp>
  inline constexpr bool __platform_wait_uses_type
#ifdef _GLIBCXX_HAVE_PLATFORM_WAIT
    = is_scalar_v<_Tp>
      && ((sizeof(_Tp) == sizeof(__detail::__platform_wait_t))
      && (alignof(_Tp) >= __detail::__platform_wait_alignment));
#else
    = false;
#endif
| 82 | |
| 83 | namespace __detail |
| 84 | { |
| 85 | #ifdef _GLIBCXX_HAVE_LINUX_FUTEX |
// Operation codes passed as the futex-op argument of the SYS_futex
// system call by __platform_wait() and __platform_notify().
enum class __futex_wait_flags : int
{
  // Basic operations.
  __wait = 0,
  __wake = 1,
  __wait_bitset = 9,
  __wake_bitset = 10,

  // Modifier OR-ed into an operation to get its "private" variant.  It is
  // zero (a no-op) unless _GLIBCXX_HAVE_LINUX_FUTEX_PRIVATE is defined.
#ifdef _GLIBCXX_HAVE_LINUX_FUTEX_PRIVATE
  __private_flag = 128,
#else
  __private_flag = 0,
#endif

  // The operations above combined with the private modifier.
  __wait_private = __wait | __private_flag,
  __wake_private = __wake | __private_flag,
  __wait_bitset_private = __wait_bitset | __private_flag,
  __wake_bitset_private = __wake_bitset | __private_flag,

  // All bits set.
  __bitset_match_any = -1
};
| 103 | |
| 104 | template<typename _Tp> |
| 105 | void |
| 106 | __platform_wait(const _Tp* __addr, __platform_wait_t __val) noexcept |
| 107 | { |
| 108 | auto __e = syscall (SYS_futex, static_cast<const void*>(__addr), |
| 109 | static_cast<int>(__futex_wait_flags::__wait_private), |
| 110 | __val, nullptr); |
| 111 | if (!__e || errno == EAGAIN) |
| 112 | return; |
| 113 | if (errno != EINTR) |
| 114 | __throw_system_error(errno); |
| 115 | } |
| 116 | |
| 117 | template<typename _Tp> |
| 118 | void |
| 119 | __platform_notify(const _Tp* __addr, bool __all) noexcept |
| 120 | { |
| 121 | syscall (SYS_futex, static_cast<const void*>(__addr), |
| 122 | static_cast<int>(__futex_wait_flags::__wake_private), |
| 123 | __all ? INT_MAX : 1); |
| 124 | } |
| 125 | #endif |
| 126 | |
// Call __gthread_yield() when gthreads and sched_yield support are both
// configured; otherwise this function does nothing.
inline void
__thread_yield() noexcept
{
#if defined(_GLIBCXX_HAS_GTHREADS) && defined(_GLIBCXX_USE_SCHED_YIELD)
  __gthread_yield();
#endif
}
| 134 | |
// Brief pause for use inside a spin loop: the pause builtin on x86 and
// x86-64, and __thread_yield() on every other target.
inline void
__thread_relax() noexcept
{
#if defined(__i386__) || defined(__x86_64__)
  __builtin_ia32_pause();
#else
  __thread_yield();
#endif
}
| 144 | |
// Spin budget used by __atomic_spin(): the predicate is polled at most
// __atomic_spin_count times, using __thread_relax() between polls for the
// first __atomic_spin_count_relax iterations and __thread_yield() after.
//
// Declared inline so that this header provides a single definition shared
// by every translation unit, like the other header-scope constants here.
inline constexpr auto __atomic_spin_count_relax = 12;
inline constexpr auto __atomic_spin_count = 16;
| 147 | |
// Default second-phase policy for __atomic_spin(): always answers false,
// so no spinning happens beyond the fixed iteration budget.
struct __default_spin_policy
{
  bool
  operator()() const noexcept
  {
    return false;
  }
};
| 154 | |
| 155 | template<typename _Pred, |
| 156 | typename _Spin = __default_spin_policy> |
| 157 | bool |
| 158 | __atomic_spin(_Pred& __pred, _Spin __spin = _Spin{ }) noexcept |
| 159 | { |
| 160 | for (auto __i = 0; __i < __atomic_spin_count; ++__i) |
| 161 | { |
| 162 | if (__pred()) |
| 163 | return true; |
| 164 | |
| 165 | if (__i < __atomic_spin_count_relax) |
| 166 | __detail::__thread_relax(); |
| 167 | else |
| 168 | __detail::__thread_yield(); |
| 169 | } |
| 170 | |
| 171 | while (__spin()) |
| 172 | { |
| 173 | if (__pred()) |
| 174 | return true; |
| 175 | } |
| 176 | |
| 177 | return false; |
| 178 | } |
| 179 | |
// Compare the object representations of __a and __b byte by byte.
// Returns true when all sizeof(_Tp) bytes are equal.
template<typename _Tp>
  bool __atomic_compare(const _Tp& __a, const _Tp& __b)
  {
    // TODO make this do the correct padding bit ignoring comparison
    const int __diff = __builtin_memcmp(&__a, &__b, sizeof(_Tp));
    return __diff == 0;
  }
| 187 | |
| 188 | struct __waiter_pool_base |
| 189 | { |
| 190 | #ifdef __cpp_lib_hardware_interference_size |
| 191 | static constexpr auto _S_align = hardware_destructive_interference_size; |
| 192 | #else |
| 193 | static constexpr auto _S_align = 64; |
| 194 | #endif |
| 195 | |
| 196 | alignas(_S_align) __platform_wait_t _M_wait = 0; |
| 197 | |
| 198 | #ifndef _GLIBCXX_HAVE_PLATFORM_WAIT |
| 199 | mutex _M_mtx; |
| 200 | #endif |
| 201 | |
| 202 | alignas(_S_align) __platform_wait_t _M_ver = 0; |
| 203 | |
| 204 | #ifndef _GLIBCXX_HAVE_PLATFORM_WAIT |
| 205 | __condvar _M_cv; |
| 206 | #endif |
| 207 | __waiter_pool_base() = default; |
| 208 | |
| 209 | void |
| 210 | _M_enter_wait() noexcept |
| 211 | { __atomic_fetch_add(&_M_wait, 1, __ATOMIC_SEQ_CST); } |
| 212 | |
| 213 | void |
| 214 | _M_leave_wait() noexcept |
| 215 | { __atomic_fetch_sub(&_M_wait, 1, __ATOMIC_RELEASE); } |
| 216 | |
| 217 | bool |
| 218 | _M_waiting() const noexcept |
| 219 | { |
| 220 | __platform_wait_t __res; |
| 221 | __atomic_load(&_M_wait, &__res, __ATOMIC_SEQ_CST); |
| 222 | return __res != 0; |
| 223 | } |
| 224 | |
| 225 | void |
| 226 | _M_notify(__platform_wait_t* __addr, [[maybe_unused]] bool __all, |
| 227 | bool __bare) noexcept |
| 228 | { |
| 229 | #ifdef _GLIBCXX_HAVE_PLATFORM_WAIT |
| 230 | if (__addr == &_M_ver) |
| 231 | { |
| 232 | __atomic_fetch_add(__addr, 1, __ATOMIC_SEQ_CST); |
| 233 | __all = true; |
| 234 | } |
| 235 | |
| 236 | if (__bare || _M_waiting()) |
| 237 | __platform_notify(__addr, __all); |
| 238 | #else |
| 239 | { |
| 240 | lock_guard<mutex> __l(_M_mtx); |
| 241 | __atomic_fetch_add(__addr, 1, __ATOMIC_RELAXED); |
| 242 | } |
| 243 | if (__bare || _M_waiting()) |
| 244 | _M_cv.notify_all(); |
| 245 | #endif |
| 246 | } |
| 247 | |
| 248 | static __waiter_pool_base& |
| 249 | _S_for(const void* __addr) noexcept |
| 250 | { |
| 251 | constexpr uintptr_t __ct = 16; |
| 252 | static __waiter_pool_base __w[__ct]; |
| 253 | auto __key = (uintptr_t(__addr) >> 2) % __ct; |
| 254 | return __w[__key]; |
| 255 | } |
| 256 | }; |
| 257 | |
| 258 | struct __waiter_pool : __waiter_pool_base |
| 259 | { |
| 260 | void |
| 261 | _M_do_wait(const __platform_wait_t* __addr, __platform_wait_t __old) noexcept |
| 262 | { |
| 263 | #ifdef _GLIBCXX_HAVE_PLATFORM_WAIT |
| 264 | __platform_wait(__addr, val: __old); |
| 265 | #else |
| 266 | __platform_wait_t __val; |
| 267 | __atomic_load(__addr, &__val, __ATOMIC_SEQ_CST); |
| 268 | if (__val == __old) |
| 269 | { |
| 270 | lock_guard<mutex> __l(_M_mtx); |
| 271 | __atomic_load(__addr, &__val, __ATOMIC_RELAXED); |
| 272 | if (__val == __old) |
| 273 | _M_cv.wait(_M_mtx); |
| 274 | } |
| 275 | #endif // __GLIBCXX_HAVE_PLATFORM_WAIT |
| 276 | } |
| 277 | }; |
| 278 | |
| 279 | template<typename _Tp> |
| 280 | struct __waiter_base |
| 281 | { |
| 282 | using __waiter_type = _Tp; |
| 283 | |
| 284 | __waiter_type& _M_w; |
| 285 | __platform_wait_t* _M_addr; |
| 286 | |
| 287 | template<typename _Up> |
| 288 | static __platform_wait_t* |
| 289 | _S_wait_addr(const _Up* __a, __platform_wait_t* __b) |
| 290 | { |
| 291 | if constexpr (__platform_wait_uses_type<_Up>) |
| 292 | return reinterpret_cast<__platform_wait_t*>(const_cast<_Up*>(__a)); |
| 293 | else |
| 294 | return __b; |
| 295 | } |
| 296 | |
| 297 | static __waiter_type& |
| 298 | _S_for(const void* __addr) noexcept |
| 299 | { |
| 300 | static_assert(sizeof(__waiter_type) == sizeof(__waiter_pool_base)); |
| 301 | auto& res = __waiter_pool_base::_S_for(__addr); |
| 302 | return reinterpret_cast<__waiter_type&>(res); |
| 303 | } |
| 304 | |
| 305 | template<typename _Up> |
| 306 | explicit __waiter_base(const _Up* __addr) noexcept |
| 307 | : _M_w(_S_for(__addr)) |
| 308 | , _M_addr(_S_wait_addr(__addr, &_M_w._M_ver)) |
| 309 | { } |
| 310 | |
| 311 | void |
| 312 | _M_notify(bool __all, bool __bare = false) noexcept |
| 313 | { _M_w._M_notify(_M_addr, __all, __bare); } |
| 314 | |
| 315 | template<typename _Up, typename _ValFn, |
| 316 | typename _Spin = __default_spin_policy> |
| 317 | static bool |
| 318 | _S_do_spin_v(__platform_wait_t* __addr, |
| 319 | const _Up& __old, _ValFn __vfn, |
| 320 | __platform_wait_t& __val, |
| 321 | _Spin __spin = _Spin{ }) |
| 322 | { |
| 323 | auto const __pred = [=] |
| 324 | { return !__detail::__atomic_compare(__old, __vfn()); }; |
| 325 | |
| 326 | if constexpr (__platform_wait_uses_type<_Up>) |
| 327 | { |
| 328 | __builtin_memcpy(&__val, &__old, sizeof(__val)); |
| 329 | } |
| 330 | else |
| 331 | { |
| 332 | __atomic_load(__addr, &__val, __ATOMIC_ACQUIRE); |
| 333 | } |
| 334 | return __atomic_spin(__pred, __spin); |
| 335 | } |
| 336 | |
| 337 | template<typename _Up, typename _ValFn, |
| 338 | typename _Spin = __default_spin_policy> |
| 339 | bool |
| 340 | _M_do_spin_v(const _Up& __old, _ValFn __vfn, |
| 341 | __platform_wait_t& __val, |
| 342 | _Spin __spin = _Spin{ }) |
| 343 | { return _S_do_spin_v(_M_addr, __old, __vfn, __val, __spin); } |
| 344 | |
| 345 | template<typename _Pred, |
| 346 | typename _Spin = __default_spin_policy> |
| 347 | static bool |
| 348 | _S_do_spin(const __platform_wait_t* __addr, |
| 349 | _Pred __pred, |
| 350 | __platform_wait_t& __val, |
| 351 | _Spin __spin = _Spin{ }) |
| 352 | { |
| 353 | __atomic_load(__addr, &__val, __ATOMIC_ACQUIRE); |
| 354 | return __atomic_spin(__pred, __spin); |
| 355 | } |
| 356 | |
| 357 | template<typename _Pred, |
| 358 | typename _Spin = __default_spin_policy> |
| 359 | bool |
| 360 | _M_do_spin(_Pred __pred, __platform_wait_t& __val, |
| 361 | _Spin __spin = _Spin{ }) |
| 362 | { return _S_do_spin(_M_addr, __pred, __val, __spin); } |
| 363 | }; |
| 364 | |
| 365 | template<typename _EntersWait> |
| 366 | struct __waiter : __waiter_base<__waiter_pool> |
| 367 | { |
| 368 | using __base_type = __waiter_base<__waiter_pool>; |
| 369 | |
| 370 | template<typename _Tp> |
| 371 | explicit __waiter(const _Tp* __addr) noexcept |
| 372 | : __base_type(__addr) |
| 373 | { |
| 374 | if constexpr (_EntersWait::value) |
| 375 | _M_w._M_enter_wait(); |
| 376 | } |
| 377 | |
| 378 | ~__waiter() |
| 379 | { |
| 380 | if constexpr (_EntersWait::value) |
| 381 | _M_w._M_leave_wait(); |
| 382 | } |
| 383 | |
| 384 | template<typename _Tp, typename _ValFn> |
| 385 | void |
| 386 | _M_do_wait_v(_Tp __old, _ValFn __vfn) |
| 387 | { |
| 388 | do |
| 389 | { |
| 390 | __platform_wait_t __val; |
| 391 | if (__base_type::_M_do_spin_v(__old, __vfn, __val)) |
| 392 | return; |
| 393 | __base_type::_M_w._M_do_wait(addr: __base_type::_M_addr, old: __val); |
| 394 | } |
| 395 | while (__detail::__atomic_compare(__old, __vfn())); |
| 396 | } |
| 397 | |
| 398 | template<typename _Pred> |
| 399 | void |
| 400 | _M_do_wait(_Pred __pred) noexcept |
| 401 | { |
| 402 | do |
| 403 | { |
| 404 | __platform_wait_t __val; |
| 405 | if (__base_type::_M_do_spin(__pred, __val)) |
| 406 | return; |
| 407 | __base_type::_M_w._M_do_wait(addr: __base_type::_M_addr, old: __val); |
| 408 | } |
| 409 | while (!__pred()); |
| 410 | } |
| 411 | }; |
| 412 | |
| 413 | using __enters_wait = __waiter<std::true_type>; |
| 414 | using __bare_wait = __waiter<std::false_type>; |
| 415 | } // namespace __detail |
| 416 | |
| 417 | template<typename _Tp, typename _ValFn> |
| 418 | void |
| 419 | __atomic_wait_address_v(const _Tp* __addr, _Tp __old, |
| 420 | _ValFn __vfn) noexcept |
| 421 | { |
| 422 | __detail::__enters_wait __w(__addr); |
| 423 | __w._M_do_wait_v(__old, __vfn); |
| 424 | } |
| 425 | |
| 426 | template<typename _Tp, typename _Pred> |
| 427 | void |
| 428 | __atomic_wait_address(const _Tp* __addr, _Pred __pred) noexcept |
| 429 | { |
| 430 | __detail::__enters_wait __w(__addr); |
| 431 | __w._M_do_wait(__pred); |
| 432 | } |
| 433 | |
| 434 | // This call is to be used by atomic types which track contention externally |
| 435 | template<typename _Pred> |
| 436 | void |
| 437 | __atomic_wait_address_bare(const __detail::__platform_wait_t* __addr, |
| 438 | _Pred __pred) noexcept |
| 439 | { |
| 440 | #ifdef _GLIBCXX_HAVE_PLATFORM_WAIT |
| 441 | do |
| 442 | { |
| 443 | __detail::__platform_wait_t __val; |
| 444 | if (__detail::__bare_wait::_S_do_spin(__addr, __pred, __val)) |
| 445 | return; |
| 446 | __detail::__platform_wait(__addr, __val); |
| 447 | } |
| 448 | while (!__pred()); |
| 449 | #else // !_GLIBCXX_HAVE_PLATFORM_WAIT |
| 450 | __detail::__bare_wait __w(__addr); |
| 451 | __w._M_do_wait(__pred); |
| 452 | #endif |
| 453 | } |
| 454 | |
| 455 | template<typename _Tp> |
| 456 | void |
| 457 | __atomic_notify_address(const _Tp* __addr, bool __all) noexcept |
| 458 | { |
| 459 | __detail::__bare_wait __w(__addr); |
| 460 | __w._M_notify(__all); |
| 461 | } |
| 462 | |
| 463 | // This call is to be used by atomic types which track contention externally |
| 464 | inline void |
| 465 | __atomic_notify_address_bare(const __detail::__platform_wait_t* __addr, |
| 466 | bool __all) noexcept |
| 467 | { |
| 468 | #ifdef _GLIBCXX_HAVE_PLATFORM_WAIT |
| 469 | __detail::__platform_notify(__addr, __all); |
| 470 | #else |
| 471 | __detail::__bare_wait __w(__addr); |
| 472 | __w._M_notify(__all, true); |
| 473 | #endif |
| 474 | } |
| 475 | _GLIBCXX_END_NAMESPACE_VERSION |
| 476 | } // namespace std |
| 477 | #endif // GTHREADS || LINUX_FUTEX |
| 478 | #endif // _GLIBCXX_ATOMIC_WAIT_H |
| 479 | |