/* pthread_cond_common -- shared code for condition variable.
   Copyright (C) 2016-2019 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <http://www.gnu.org/licenses/>.  */

#include <atomic.h>
#include <stdint.h>
#include <pthread.h>

/* We need 3 least-significant bits on __wrefs for something else.  */
#define __PTHREAD_COND_MAX_GROUP_SIZE ((unsigned) 1 << 29)
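
/* Note (for clarity): with the three least-significant bits of the 32-bit
   __wrefs field reserved as flags, only 32 - 3 = 29 bits remain for counting
   waiter references, so at most 1 << 29 waiters can be accounted for at
   once; the group size limit above follows from that.  */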

#if __HAVE_64B_ATOMICS == 1

static uint64_t __attribute__ ((unused))
__condvar_load_wseq_relaxed (pthread_cond_t *cond)
{
  return atomic_load_relaxed (&cond->__data.__wseq);
}

static uint64_t __attribute__ ((unused))
__condvar_fetch_add_wseq_acquire (pthread_cond_t *cond, unsigned int val)
{
  return atomic_fetch_add_acquire (&cond->__data.__wseq, val);
}

static uint64_t __attribute__ ((unused))
__condvar_fetch_xor_wseq_release (pthread_cond_t *cond, unsigned int val)
{
  return atomic_fetch_xor_release (&cond->__data.__wseq, val);
}

static uint64_t __attribute__ ((unused))
__condvar_load_g1_start_relaxed (pthread_cond_t *cond)
{
  return atomic_load_relaxed (&cond->__data.__g1_start);
}

static void __attribute__ ((unused))
__condvar_add_g1_start_relaxed (pthread_cond_t *cond, unsigned int val)
{
  /* A plain load-add-store is sufficient here: __g1_start has a single
     writer at a time (it is updated only while holding the condvar-internal
     lock), so no atomic read-modify-write is needed, only atomicity of the
     individual load and store.  */
  atomic_store_relaxed (&cond->__data.__g1_start,
			atomic_load_relaxed (&cond->__data.__g1_start) + val);
}

#else

/* We use two 64b counters: __wseq and __g1_start.  They are monotonically
   increasing and single-writer-multiple-readers counters, so we can
   implement load, fetch-and-add, and fetch-and-xor operations even when we
   just have 32b atomics.  Values we add or xor are less than or equal to
   1 << 31 (*), so we only have to make overflow-and-addition atomic with
   respect to concurrent load operations and xor operations.  To do that, we
   split each counter into two 32b values and reserve the MSB of each half to
   represent an overflow from the lower-order half to the higher-order half.

   In the common case, the state is (notation: higher-order half /
   lower-order half, where '.' concatenates the overflow bit with the 31-bit
   value):
     0.h / 0.l = h.l
   When we add a value x that overflows (i.e., 0.l + x == 1.L), we run the
   following steps S1-S4 (the values these represent are on the right-hand
   side):
     S1: 0.h     / 1.L == (h+1).L
     S2: 1.(h+1) / 1.L == (h+1).L
     S3: 1.(h+1) / 0.L == (h+1).L
     S4: 0.(h+1) / 0.L == (h+1).L
   If the MSB (the overflow bit) of the higher-order half is set, readers
   will ignore the overflow bit in the lower-order half.

   To get an atomic snapshot in load operations, we exploit that the
   higher-order half is monotonically increasing; if we load a value V from
   it, then read the lower-order half, and then read the higher-order half
   again and see the same value V, we know that both halves have existed in
   the sequence of values the full counter had.  This is similar to the
   validated reads in the time-based STMs in GCC's libitm (e.g.,
   method_ml_wt).

   The xor operation needs to be an atomic read-modify-write.  The write
   itself is not an issue as it affects just the lower-order half but not
   bits used in the add operation.  To make the full fetch-and-xor atomic,
   we exploit that concurrently, the value can increase by at most 1 << 31
   (*): The xor operation is only called while having acquired the lock, so
   not more than __PTHREAD_COND_MAX_GROUP_SIZE waiters can enter concurrently
   and thus increment __wseq.  Therefore, if the xor operation observes a
   value of __wseq, then the value it applies the modification to later on
   can be derived (see below).

   One benefit of this scheme is that it makes load operations
   obstruction-free: unlike with a scheme that simply locks the counter,
   readers can almost always interpret a snapshot of the two halves.  Readers
   can be forced to read a new snapshot only when the read is concurrent with
   an overflow.  However, overflows will happen infrequently, so load
   operations are practically lock-free.

   (*) The highest value we add is __PTHREAD_COND_MAX_GROUP_SIZE << 2 to
   __g1_start (the two extra bits are for the lock in the two LSBs of
   __g1_start).  */
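
/* Worked example (illustration only; the values are chosen for clarity):
   assume the logical counter is 2.0x7fffffff (h == 2, all 31 value bits of
   the lower-order half set) and a fetch-and-add of 1 arrives:
     S1: low  = 1.0 (word 0x80000000): the fetch-add sets the overflow bit;
	 the logical value is already 3.0 because readers treat the set
	 overflow bit as a pending carry while high's MSB is clear.
     S2: high = 1.3 (word 0x80000003): higher-order half incremented; its
	 overflow bit tells readers to ignore the bit still set in 'low'.
     S3: low  = 0.0: overflow bit in the lower-order half cleared.
     S4: high = 0.3: back to the common-case encoding of 3.0.
   At every step, a validated read (see __condvar_load_64_relaxed below)
   either decodes the logical value 3.0 or retries.  */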

typedef struct
{
  unsigned int low;
  unsigned int high;
} _condvar_lohi;

static uint64_t
__condvar_fetch_add_64_relaxed (_condvar_lohi *lh, unsigned int op)
{
  /* S1.  Note that this is an atomic read-modify-write so it extends the
     release sequence of release MO store at S3.  */
  unsigned int l = atomic_fetch_add_relaxed (&lh->low, op);
  unsigned int h = atomic_load_relaxed (&lh->high);
  uint64_t result = ((uint64_t) h << 31) | l;
  l += op;
  if ((l >> 31) > 0)
    {
      /* Overflow.  Need to increment higher-order half.  Note that all
	 add operations are ordered in happens-before.  */
      h++;
      /* S2.  Release MO to synchronize with the loads of the higher-order
	 half in the load operation.  See __condvar_load_64_relaxed.  */
      atomic_store_release (&lh->high, h | ((unsigned int) 1 << 31));
      l ^= (unsigned int) 1 << 31;
      /* S3.  See __condvar_load_64_relaxed.  */
      atomic_store_release (&lh->low, l);
      /* S4.  Likewise.  */
      atomic_store_release (&lh->high, h);
    }
  return result;
}

static uint64_t
__condvar_load_64_relaxed (_condvar_lohi *lh)
{
  unsigned int h, l, h2;
  do
    {
      /* This load, and the second load below from the same location, read
	 from the stores in the overflow handling of the add operation or
	 from the initializing stores (which is a simple special case because
	 initialization always completely happens before further use).
	 Because no two stores to the higher-order half write the same value,
	 the loop ensures that if we continue to use the snapshot, this load
	 and the second one read from the same store operation.  All
	 candidate store operations have release MO.
	 If we read from S2 in the first load, then we will see the value of
	 S1 on the next load (because we synchronize with S2), or a value
	 later in modification order.  We correctly ignore the lower half's
	 overflow bit in this case.  If we read from S4, then we will see the
	 value of S3 in the next load (or a later value), which does not have
	 the overflow bit set anymore.  */
      h = atomic_load_acquire (&lh->high);
      /* This will read from the release sequence of S3 (i.e., either the S3
	 store or the read-modify-writes at S1 following S3 in modification
	 order).  Thus, the read synchronizes with S3, and the following load
	 of the higher-order half will read from the matching S2 (or a later
	 value).
	 Thus, if we read a lower-half value here that already overflowed and
	 belongs to an increased higher-order half value, we will see the
	 latter and h and h2 will not be equal.  */
      l = atomic_load_acquire (&lh->low);
      /* See above.  */
      h2 = atomic_load_relaxed (&lh->high);
    }
  while (h != h2);
  if (((l >> 31) > 0) && ((h >> 31) > 0))
    l ^= (unsigned int) 1 << 31;
  return ((uint64_t) (h & ~((unsigned int) 1 << 31)) << 31) + l;
}
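
/* As an additional illustration: the retry loop above rejects torn
   snapshots.  If a concurrent add overflows between our two loads of the
   higher-order half, the S2 or S4 store changes that half, h != h2 holds,
   and we retry; a snapshot is only used if both loads of the higher-order
   half observed the very same store.  */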

static uint64_t __attribute__ ((unused))
__condvar_load_wseq_relaxed (pthread_cond_t *cond)
{
  return __condvar_load_64_relaxed ((_condvar_lohi *) &cond->__data.__wseq32);
}

static uint64_t __attribute__ ((unused))
__condvar_fetch_add_wseq_acquire (pthread_cond_t *cond, unsigned int val)
{
  uint64_t r = __condvar_fetch_add_64_relaxed
      ((_condvar_lohi *) &cond->__data.__wseq32, val);
  atomic_thread_fence_acquire ();
  return r;
}

static uint64_t __attribute__ ((unused))
__condvar_fetch_xor_wseq_release (pthread_cond_t *cond, unsigned int val)
{
  _condvar_lohi *lh = (_condvar_lohi *) &cond->__data.__wseq32;
  /* First, get the current value.  See __condvar_load_64_relaxed.  */
  unsigned int h, l, h2;
  do
    {
      h = atomic_load_acquire (&lh->high);
      l = atomic_load_acquire (&lh->low);
      h2 = atomic_load_relaxed (&lh->high);
    }
  while (h != h2);
  if (((l >> 31) > 0) && ((h >> 31) == 0))
    h++;
  h &= ~((unsigned int) 1 << 31);
  l &= ~((unsigned int) 1 << 31);
  /* Now modify.  Due to the coherence rules, the prior load will read a
     value earlier in modification order than the following fetch-xor.
     This uses release MO to make the full operation have release semantics
     (all other operations access the lower-order half).  */
  unsigned int l2 = atomic_fetch_xor_release (&lh->low, val)
      & ~((unsigned int) 1 << 31);
  if (l2 < l)
    /* The lower-order half overflowed in the meantime.  This happened
       exactly once due to the limit on concurrent waiters (see above).  */
    h++;
  return ((uint64_t) h << 31) + l2;
}

static uint64_t __attribute__ ((unused))
__condvar_load_g1_start_relaxed (pthread_cond_t *cond)
{
  return __condvar_load_64_relaxed
      ((_condvar_lohi *) &cond->__data.__g1_start32);
}

static void __attribute__ ((unused))
__condvar_add_g1_start_relaxed (pthread_cond_t *cond, unsigned int val)
{
  ignore_value (__condvar_fetch_add_64_relaxed
      ((_condvar_lohi *) &cond->__data.__g1_start32, val));
}

#endif  /* !__HAVE_64B_ATOMICS  */

/* The lock that signalers use.  See pthread_cond_wait_common for uses.
   The lock is our normal three-state lock: not acquired (0) / acquired (1) /
   acquired-with-futex_wake-request (2).  However, we need to preserve the
   other bits in the unsigned int used for the lock, and therefore it is a
   little more complex.  */
static void __attribute__ ((unused))
__condvar_acquire_lock (pthread_cond_t *cond, int private)
{
  unsigned int s = atomic_load_relaxed (&cond->__data.__g1_orig_size);
  while ((s & 3) == 0)
    {
      if (atomic_compare_exchange_weak_acquire (&cond->__data.__g1_orig_size,
						&s, s | 1))
	return;
      /* TODO Spinning and back-off.  */
    }
  /* We could not acquire the lock directly, so make sure the wake-request
     state (2) is set so that a release will wake us via the futex; if our
     CAS changes the state from not acquired (0) to 2, we have acquired the
     lock after all.  Otherwise, block on the futex and retry.  */
  while (1)
    {
      while ((s & 3) != 2)
	{
	  if (atomic_compare_exchange_weak_acquire
	      (&cond->__data.__g1_orig_size, &s, (s & ~(unsigned int) 3) | 2))
	    {
	      if ((s & 3) == 0)
		return;
	      break;
	    }
	  /* TODO Back off.  */
	}
      futex_wait_simple (&cond->__data.__g1_orig_size,
			 (s & ~(unsigned int) 3) | 2, private);
      /* Reload so we see a recent value.  */
      s = atomic_load_relaxed (&cond->__data.__g1_orig_size);
    }
}

/* See __condvar_acquire_lock.  */
static void __attribute__ ((unused))
__condvar_release_lock (pthread_cond_t *cond, int private)
{
  if ((atomic_fetch_and_release (&cond->__data.__g1_orig_size,
				 ~(unsigned int) 3) & 3)
      == 2)
    futex_wake (&cond->__data.__g1_orig_size, 1, private);
}

/* Only use this when having acquired the lock.  */
static unsigned int __attribute__ ((unused))
__condvar_get_orig_size (pthread_cond_t *cond)
{
  return atomic_load_relaxed (&cond->__data.__g1_orig_size) >> 2;
}

/* Only use this when having acquired the lock.  */
static void __attribute__ ((unused))
__condvar_set_orig_size (pthread_cond_t *cond, unsigned int size)
{
  /* We have acquired the lock, but might get one concurrent update due to a
     lock state change from acquired to acquired-with-futex_wake-request.
     The store with relaxed MO is fine because there will be no further
     changes to the lock bits nor the size, and we will subsequently release
     the lock with release MO.  */
  unsigned int s;
  s = (atomic_load_relaxed (&cond->__data.__g1_orig_size) & 3)
      | (size << 2);
  if ((atomic_exchange_relaxed (&cond->__data.__g1_orig_size, s) & 3)
      != (s & 3))
    atomic_store_relaxed (&cond->__data.__g1_orig_size, (size << 2) | 2);
}

/* Returns FUTEX_SHARED or FUTEX_PRIVATE based on the provided __wrefs
   value.  */
static int __attribute__ ((unused))
__condvar_get_private (int flags)
{
  if ((flags & __PTHREAD_COND_SHARED_MASK) == 0)
    return FUTEX_PRIVATE;
  else
    return FUTEX_SHARED;
}
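
/* Usage sketch (hypothetical caller; the actual call sites live in the
   wait/signal/broadcast implementations): per the comment above, the flags
   argument is derived from the condvar's __wrefs field, whose reserved
   low-order bits include the process-shared flag tested here, e.g.:

     int private
	= __condvar_get_private (atomic_load_relaxed (&cond->__data.__wrefs));  */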

/* This closes G1 (whose index is in G1INDEX), waits for all futex waiters to
   leave G1, converts G1 into a fresh G2, and then switches group roles so
   that the former G2 becomes the new G1 ending at the current __wseq value
   when we eventually make the switch (WSEQ is just an observation of __wseq
   by the signaler).
   If G2 is empty, it will not switch groups because then it would create an
   empty G1 which would require switching groups again on the next signal.
   Returns false iff groups were not switched because G2 was empty.  */
static bool __attribute__ ((unused))
__condvar_quiesce_and_switch_g1 (pthread_cond_t *cond, uint64_t wseq,
				 unsigned int *g1index, int private)
{
  const unsigned int maxspin = 0;
  unsigned int g1 = *g1index;

  /* If there is no waiter in G2, we don't do anything.  The expression may
     look odd but remember that __g_size might hold a negative value, so
     putting the expression this way avoids relying on implementation-defined
     behavior.
     Note that this works correctly for a zero-initialized condvar too.  */
  unsigned int old_orig_size = __condvar_get_orig_size (cond);
  uint64_t old_g1_start = __condvar_load_g1_start_relaxed (cond) >> 1;
  if (((unsigned) (wseq - old_g1_start - old_orig_size)
       + cond->__data.__g_size[g1 ^ 1]) == 0)
    return false;

  /* Now try to close and quiesce G1.  We have to consider the following
     kinds of waiters:
     * Waiters from less recent groups than G1 are not affected because
       nothing will change for them apart from __g1_start getting larger.
     * New waiters arriving concurrently with the group switching will all
       go into G2 until we atomically make the switch.  Waiters existing in
       G2 are not affected.
     * Waiters in G1 will be closed out immediately by setting a flag in
       __g_signals, which will prevent waiters from blocking using a futex on
       __g_signals and also notifies them that the group is closed.  As a
       result, they will eventually remove their group reference, allowing us
       to switch group roles.  */

  /* First, set the closed flag on __g_signals.  This tells waiters that are
     about to wait that they shouldn't do that anymore.  This basically
     serves as an advance notification of the upcoming change to __g1_start;
     waiters interpret it as if __g1_start was larger than their waiter
     sequence position.  This allows us to change __g1_start after waiting
     for all existing waiters with group references to leave, which in turn
     makes recovery after stealing a signal simpler because it then can be
     skipped if __g1_start indicates that the group is closed (otherwise, we
     would have to recover always because waiters don't know how big their
     groups are).  Relaxed MO is fine.  */
  atomic_fetch_or_relaxed (cond->__data.__g_signals + g1, 1);

  /* Wait until there are no group references anymore.  The fetch-or
     operation injects us into the modification order of __g_refs; release MO
     ensures that waiters incrementing __g_refs after our fetch-or see the
     previous changes to __g_signals and to __g1_start that had to happen
     before we can switch this G1 and alias with an older group (we have two
     groups, so aliasing requires switching group roles twice).  Note that
     nobody else can have set the wake-request flag, so we do not have to act
     upon it.
     Also note that it is harmless if older waiters or waiters from this G1
     get a group reference after we have quiesced the group because it will
     remain closed for them either because of the closed flag in __g_signals
     or the later update to __g1_start.  New waiters will never arrive here
     but instead continue to go into the still current G2.  */
  unsigned r = atomic_fetch_or_release (cond->__data.__g_refs + g1, 0);
  while ((r >> 1) > 0)
    {
      for (unsigned int spin = maxspin; ((r >> 1) > 0) && (spin > 0); spin--)
	{
	  /* TODO Back off.  */
	  r = atomic_load_relaxed (cond->__data.__g_refs + g1);
	}
      if ((r >> 1) > 0)
	{
	  /* There is still a waiter after spinning.  Set the wake-request
	     flag and block.  Relaxed MO is fine because this is just about
	     this futex word.
	     Update r to include the set wake-request flag so that the
	     upcoming futex_wait only blocks if the flag is still set
	     (otherwise, we'd violate the basic client-side futex
	     protocol).  */
	  r = atomic_fetch_or_relaxed (cond->__data.__g_refs + g1, 1) | 1;
	  if ((r >> 1) > 0)
	    futex_wait_simple (cond->__data.__g_refs + g1, r, private);
	  /* Reload here so we eventually see the most recent value even if
	     we do not spin.  */
	  r = atomic_load_relaxed (cond->__data.__g_refs + g1);
	}
    }
  /* Acquire MO so that we synchronize with the release operation that
     waiters use to decrement __g_refs and thus happen after the waiters we
     waited for.  */
  atomic_thread_fence_acquire ();

  /* Update __g1_start, which finishes closing this group.  The value we add
     will never be negative because old_orig_size can only be zero when we
     switch groups the first time after a condvar was initialized, in which
     case G1 will be at index 1 and we will add a value of 1.  See above for
     why this takes place after waiting for quiescence of the group.
     Relaxed MO is fine because the change comes with no additional
     constraints that others would have to observe.  */
  __condvar_add_g1_start_relaxed (cond,
				  (old_orig_size << 1) + (g1 == 1 ? 1 : -1));

  /* Now reopen the group, thus enabling waiters to again block using the
     futex controlled by __g_signals.  Release MO so that observers that see
     no signals (and thus can block) also see the write __g1_start and thus
     that this is now a new group (see __pthread_cond_wait_common for the
     matching acquire MO loads).  */
  atomic_store_release (cond->__data.__g_signals + g1, 0);
- No old waiter can neither grab a signal nor acquire a reference without
- noticing that __g1_start is larger.
- We can now publish the group switch by flipping the G2 index in __wseq.
- Release MO so that this synchronizes with the acquire MO operation
- waiters use to obtain a position in the waiter sequence. */
- wseq = __condvar_fetch_xor_wseq_release (cond, 1) >> 1;
- g1 ^= 1;
- *g1index ^= 1;
- /* These values are just observed by signalers, and thus protected by the
- lock. */
- unsigned int orig_size = wseq - (old_g1_start + old_orig_size);
- __condvar_set_orig_size (cond, orig_size);
- /* Use and addition to not loose track of cancellations in what was
- previously G2. */
- cond->__data.__g_size[g1] += orig_size;
- /* The new G1's size may be zero because of cancellations during its time
- as G2. If this happens, there are no waiters that have to receive a
- signal, so we do not need to add any and return false. */
- if (cond->__data.__g_size[g1] == 0)
- return false;
- return true;
- }
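
/* Caller sketch (hypothetical, condensed; the real caller logic lives in
   pthread_cond_signal): a signaler first checks whether G1 still has
   unsignaled waiters and only otherwise tries to switch groups before
   posting a signal:

     if (cond->__data.__g_size[g1] != 0
	 || __condvar_quiesce_and_switch_g1 (cond, wseq, &g1, private))
       {
	 ... add a signal to __g_signals[g1] and futex-wake a G1 waiter ...
       }  */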