Blame nptl/tst-rwlock-tryrdlock-stall.c

Packit Service e75323
/* Bug 23844: Test for pthread_rwlock_tryrdlock stalls.
Packit Service e75323
   Copyright (C) 2019 Free Software Foundation, Inc.
Packit Service e75323
   This file is part of the GNU C Library.
Packit Service e75323
Packit Service e75323
   The GNU C Library is free software; you can redistribute it and/or
Packit Service e75323
   modify it under the terms of the GNU Lesser General Public
Packit Service e75323
   License as published by the Free Software Foundation; either
Packit Service e75323
   version 2.1 of the License, or (at your option) any later version.
Packit Service e75323
Packit Service e75323
   The GNU C Library is distributed in the hope that it will be useful,
Packit Service e75323
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit Service e75323
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit Service e75323
   Lesser General Public License for more details.
Packit Service e75323
Packit Service e75323
   You should have received a copy of the GNU Lesser General Public
Packit Service e75323
   License along with the GNU C Library; if not, see
Packit Service e75323
   <http://www.gnu.org/licenses/>.  */
Packit Service e75323
Packit Service e75323
/* For a full analysis see comment:
Packit Service e75323
   https://sourceware.org/bugzilla/show_bug.cgi?id=23844#c14
Packit Service e75323
Packit Service e75323
   Provided here for reference:
Packit Service e75323
Packit Service e75323
   --- Analysis of pthread_rwlock_tryrdlock() stall ---
Packit Service e75323
   A read lock begins to execute.
Packit Service e75323
Packit Service e75323
   In __pthread_rwlock_rdlock_full:
Packit Service e75323
Packit Service e75323
   We can attempt a read lock, but find that the lock is
Packit Service e75323
   in a write phase (PTHREAD_RWLOCK_WRPHASE, or WP-bit
Packit Service e75323
   is set), and the lock is held by a primary writer
Packit Service e75323
   (PTHREAD_RWLOCK_WRLOCKED is set). In this case we must
Packit Service e75323
   wait for explicit hand over from the writer to us or
Packit Service e75323
   one of the other waiters. The read lock threads are
Packit Service e75323
   about to execute:
Packit Service e75323
Packit Service e75323
   341   r = (atomic_fetch_add_acquire (&rwlock->__data.__readers,
Packit Service e75323
   342                                  (1 << PTHREAD_RWLOCK_READER_SHIFT))
Packit Service e75323
   343        + (1 << PTHREAD_RWLOCK_READER_SHIFT));
Packit Service e75323
Packit Service e75323
   An unlock begins to execute.
Packit Service e75323
Packit Service e75323
   Then in __pthread_rwlock_wrunlock:
Packit Service e75323
Packit Service e75323
   547   unsigned int r = atomic_load_relaxed (&rwlock->__data.__readers);
Packit Service e75323
   ...
Packit Service e75323
   549   while (!atomic_compare_exchange_weak_release
Packit Service e75323
   550          (&rwlock->__data.__readers, &r,
Packit Service e75323
   551           ((r ^ PTHREAD_RWLOCK_WRLOCKED)
Packit Service e75323
   552            ^ ((r >> PTHREAD_RWLOCK_READER_SHIFT) == 0 ? 0
Packit Service e75323
   553               : PTHREAD_RWLOCK_WRPHASE))))
Packit Service e75323
   554     {
Packit Service e75323
   ...
Packit Service e75323
   556     }
Packit Service e75323
Packit Service e75323
   We clear PTHREAD_RWLOCK_WRLOCKED, and if there are
Packit Service e75323
   no readers so we leave the lock in PTHREAD_RWLOCK_WRPHASE.
Packit Service e75323
Packit Service e75323
   Back in the read lock.
Packit Service e75323
Packit Service e75323
   The read lock adjusts __readers as above.
Packit Service e75323
Packit Service e75323
   383   while ((r & PTHREAD_RWLOCK_WRPHASE) != 0
Packit Service e75323
   384          && (r & PTHREAD_RWLOCK_WRLOCKED) == 0)
Packit Service e75323
   385     {
Packit Service e75323
   ...
Packit Service e75323
   390       if (atomic_compare_exchange_weak_acquire (&rwlock->__data.__readers, &r,
Packit Service e75323
   391                                                 r ^ PTHREAD_RWLOCK_WRPHASE))
Packit Service e75323
   392         {
Packit Service e75323
Packit Service e75323
   And then attempts to start the read phase.
Packit Service e75323
Packit Service e75323
   Assume there happens to be a tryrdlock at this point, noting
Packit Service e75323
   that PTHREAD_RWLOCK_WRLOCKED is clear, and PTHREAD_RWLOCK_WRPHASE
Packit Service e75323
   is 1. So the try lock attempts to start the read phase.
Packit Service e75323
Packit Service e75323
   In __pthread_rwlock_tryrdlock:
Packit Service e75323
Packit Service e75323
    44       if ((r & PTHREAD_RWLOCK_WRPHASE) == 0)
Packit Service e75323
    45         {
Packit Service e75323
   ...
Packit Service e75323
    49           if (((r & PTHREAD_RWLOCK_WRLOCKED) != 0)
Packit Service e75323
    50               && (rwlock->__data.__flags
Packit Service e75323
    51                   == PTHREAD_RWLOCK_PREFER_WRITER_NONRECURSIVE_NP))
Packit Service e75323
    52             return EBUSY;
Packit Service e75323
    53           rnew = r + (1 << PTHREAD_RWLOCK_READER_SHIFT);
Packit Service e75323
    54         }
Packit Service e75323
   ...
Packit Service e75323
    89   while (!atomic_compare_exchange_weak_acquire (&rwlock->__data.__readers,
Packit Service e75323
    90       &r, rnew));
Packit Service e75323
Packit Service e75323
   And succeeds.
Packit Service e75323
Packit Service e75323
   Back in the write unlock:
Packit Service e75323
Packit Service e75323
   557   if ((r >> PTHREAD_RWLOCK_READER_SHIFT) != 0)
Packit Service e75323
   558     {
Packit Service e75323
   ...
Packit Service e75323
   563       if ((atomic_exchange_relaxed (&rwlock->__data.__wrphase_futex, 0)
Packit Service e75323
   564            & PTHREAD_RWLOCK_FUTEX_USED) != 0)
Packit Service e75323
   565         futex_wake (&rwlock->__data.__wrphase_futex, INT_MAX, private);
Packit Service e75323
   566     }
Packit Service e75323
Packit Service e75323
   We note that PTHREAD_RWLOCK_FUTEX_USED is non-zero
Packit Service e75323
   and don't wake anyone. This is OK because we handed
Packit Service e75323
   over to the trylock. It will be the trylock's responsibility
Packit Service e75323
   to wake any waiters.
Packit Service e75323
Packit Service e75323
   Back in the read lock:
Packit Service e75323
Packit Service e75323
   The read lock fails to install PTHREAD_RWLOCK_WRPHASE as 0 because
Packit Service e75323
   the __readers value was adjusted by the trylock, and so it falls through
Packit Service e75323
   to waiting on the lock for explicit handover from either a new writer
Packit Service e75323
   or a new reader.
Packit Service e75323
Packit Service e75323
   448           int err = futex_abstimed_wait (&rwlock->__data.__wrphase_futex,
Packit Service e75323
   449                                          1 | PTHREAD_RWLOCK_FUTEX_USED,
Packit Service e75323
   450                                          abstime, private);
Packit Service e75323
Packit Service e75323
   We use PTHREAD_RWLOCK_FUTEX_USED to indicate the futex
Packit Service e75323
   is in use.
Packit Service e75323
Packit Service e75323
   At this point we have readers waiting on the read lock
Packit Service e75323
   to unlock. The wrlock is done. The trylock is finishing
Packit Service e75323
   the installation of the read phase.
Packit Service e75323
Packit Service e75323
    92   if ((r & PTHREAD_RWLOCK_WRPHASE) != 0)
Packit Service e75323
    93     {
Packit Service e75323
   ...
Packit Service e75323
   105       atomic_store_relaxed (&rwlock->__data.__wrphase_futex, 0);
Packit Service e75323
   106     }
Packit Service e75323
Packit Service e75323
   The trylock does note that we were the one that
Packit Service e75323
   installed the read phase, but the comments are not
Packit Service e75323
   correct, the execution ordering above shows that
Packit Service e75323
   readers might indeed be waiting, and they are.
Packit Service e75323
Packit Service e75323
   The atomic_store_relaxed throws away PTHREAD_RWLOCK_FUTEX_USED,
Packit Service e75323
   and the waiting reader is never woken because as noted
Packit Service e75323
   above it is conditional on the futex being used.
Packit Service e75323
Packit Service e75323
   The solution is for the trylock thread to inspect
Packit Service e75323
   PTHREAD_RWLOCK_FUTEX_USED and wake the waiting readers.
Packit Service e75323
Packit Service e75323
   --- Analysis of pthread_rwlock_trywrlock() stall ---
Packit Service e75323
Packit Service e75323
   A write lock begins to execute, takes the write lock,
Packit Service e75323
   and then releases the lock...
Packit Service e75323
Packit Service e75323
   In pthread_rwlock_wrunlock():
Packit Service e75323
Packit Service e75323
   547   unsigned int r = atomic_load_relaxed (&rwlock->__data.__readers);
Packit Service e75323
   ...
Packit Service e75323
   549   while (!atomic_compare_exchange_weak_release
Packit Service e75323
   550          (&rwlock->__data.__readers, &r,
Packit Service e75323
   551           ((r ^ PTHREAD_RWLOCK_WRLOCKED)
Packit Service e75323
   552            ^ ((r >> PTHREAD_RWLOCK_READER_SHIFT) == 0 ? 0
Packit Service e75323
   553               : PTHREAD_RWLOCK_WRPHASE))))
Packit Service e75323
   554     {
Packit Service e75323
   ...
Packit Service e75323
   556     }
Packit Service e75323
Packit Service e75323
   ... leaving it in the write phase with zero readers
Packit Service e75323
   (the case where we leave the write phase in place
Packit Service e75323
   during a write unlock).
Packit Service e75323
Packit Service e75323
   A write trylock begins to execute.
Packit Service e75323
Packit Service e75323
   In __pthread_rwlock_trywrlock:
Packit Service e75323
Packit Service e75323
    40   while (((r & PTHREAD_RWLOCK_WRLOCKED) == 0)
Packit Service e75323
    41       && (((r >> PTHREAD_RWLOCK_READER_SHIFT) == 0)
Packit Service e75323
    42           || (prefer_writer && ((r & PTHREAD_RWLOCK_WRPHASE) != 0))))
Packit Service e75323
    43     {
Packit Service e75323
Packit Service e75323
   The lock is not locked.
Packit Service e75323
Packit Service e75323
   There are no readers.
Packit Service e75323
Packit Service e75323
    45       if (atomic_compare_exchange_weak_acquire (
Packit Service e75323
    46           &rwlock->__data.__readers, &r,
Packit Service e75323
    47           r | PTHREAD_RWLOCK_WRPHASE | PTHREAD_RWLOCK_WRLOCKED))
Packit Service e75323
Packit Service e75323
   We atomically install the write phase and we take the
Packit Service e75323
   exclusive write lock.
Packit Service e75323
Packit Service e75323
    48         {
Packit Service e75323
    49           atomic_store_relaxed (&rwlock->__data.__writers_futex, 1);
Packit Service e75323
Packit Service e75323
   We get this far.
Packit Service e75323
Packit Service e75323
   A reader lock begins to execute.
Packit Service e75323
Packit Service e75323
   In pthread_rwlock_rdlock:
Packit Service e75323
Packit Service e75323
   437   for (;;)
Packit Service e75323
   438     {
Packit Service e75323
   439       while (((wpf = atomic_load_relaxed (&rwlock->__data.__wrphase_futex))
Packit Service e75323
   440               | PTHREAD_RWLOCK_FUTEX_USED) == (1 | PTHREAD_RWLOCK_FUTEX_USED))
Packit Service e75323
   441         {
Packit Service e75323
   442           int private = __pthread_rwlock_get_private (rwlock);
Packit Service e75323
   443           if (((wpf & PTHREAD_RWLOCK_FUTEX_USED) == 0)
Packit Service e75323
   444               && (!atomic_compare_exchange_weak_relaxed
Packit Service e75323
   445                   (&rwlock->__data.__wrphase_futex,
Packit Service e75323
   446                    &wpf, wpf | PTHREAD_RWLOCK_FUTEX_USED)))
Packit Service e75323
   447             continue;
Packit Service e75323
   448           int err = futex_abstimed_wait (&rwlock->__data.__wrphase_futex,
Packit Service e75323
   449                                          1 | PTHREAD_RWLOCK_FUTEX_USED,
Packit Service e75323
   450                                          abstime, private);
Packit Service e75323
Packit Service e75323
   We are in a write phase, so the while() on line 439 is true.
Packit Service e75323
Packit Service e75323
   The value of wpf does not have PTHREAD_RWLOCK_FUTEX_USED set
Packit Service e75323
   since this is the first reader to lock.
Packit Service e75323
Packit Service e75323
   The atomic operation sets wpf with PTHREAD_RWLOCK_FUTEX_USED
Packit Service e75323
   on the expectation that this reader will be woken during
Packit Service e75323
   the handoff.
Packit Service e75323
Packit Service e75323
   Back in pthread_rwlock_trywrlock:
Packit Service e75323
Packit Service e75323
    50           atomic_store_relaxed (&rwlock->__data.__wrphase_futex, 1);
Packit Service e75323
    51           atomic_store_relaxed (&rwlock->__data.__cur_writer,
Packit Service e75323
    52               THREAD_GETMEM (THREAD_SELF, tid));
Packit Service e75323
    53           return 0;
Packit Service e75323
    54         }
Packit Service e75323
   ...
Packit Service e75323
    57     }
Packit Service e75323
Packit Service e75323
   We write 1 to __wrphase_futex discarding PTHREAD_RWLOCK_FUTEX_USED,
Packit Service e75323
   and so in the unlock we will not awaken the waiting reader.
Packit Service e75323
Packit Service e75323
   The solution to this is to realize that if we did not start the write
Packit Service e75323
   phase we need not write 1 or any other value to __wrphase_futex.
Packit Service e75323
   This ensures that any readers (which saw __wrphase_futex != 0) can
Packit Service e75323
   set PTHREAD_RWLOCK_FUTEX_USED and this can be used at unlock to
Packit Service e75323
   wake them.
Packit Service e75323
Packit Service e75323
   If we installed the write phase then all other readers are looping
Packit Service e75323
   here:
Packit Service e75323
Packit Service e75323
   In __pthread_rwlock_rdlock_full:
Packit Service e75323
Packit Service e75323
   437   for (;;)
Packit Service e75323
   438     {
Packit Service e75323
   439       while (((wpf = atomic_load_relaxed (&rwlock->__data.__wrphase_futex))
Packit Service e75323
   440               | PTHREAD_RWLOCK_FUTEX_USED) == (1 | PTHREAD_RWLOCK_FUTEX_USED))
Packit Service e75323
   441         {
Packit Service e75323
   ...
Packit Service e75323
   508     }
Packit Service e75323
Packit Service e75323
   waiting for the write phase to be installed or removed before they
Packit Service e75323
   can begin waiting on __wrphase_futex (part of the algorithm), or
Packit Service e75323
   taking a concurrent read lock, and thus we can safely write 1 to
Packit Service e75323
   __wrphase_futex.
Packit Service e75323
Packit Service e75323
   If we did not install the write phase then the readers may already
Packit Service e75323
   be waiting on the futex, the original writer wrote 1 to __wrphase_futex
Packit Service e75323
   as part of starting the write phase, and we cannot also write 1
Packit Service e75323
   without losing the PTHREAD_RWLOCK_FUTEX_USED bit.
Packit Service e75323
Packit Service e75323
   ---
Packit Service e75323
Packit Service e75323
   Summary for the pthread_rwlock_tryrdlock() stall:
Packit Service e75323
Packit Service e75323
   The stall is caused by pthread_rwlock_tryrdlock failing to check
Packit Service e75323
   that PTHREAD_RWLOCK_FUTEX_USED is set in the __wrphase_futex futex
Packit Service e75323
   and then waking the futex.
Packit Service e75323
Packit Service e75323
   The fix for bug 23844 ensures that waiters on __wrphase_futex are
Packit Service e75323
   correctly woken.  Before the fix the test stalls as readers can
Packit Service e75323
   wait forever on __wrphase_futex.  */
Packit Service e75323
Packit Service e75323
#include <stdio.h>
Packit Service e75323
#include <stdlib.h>
Packit Service e75323
#include <unistd.h>
Packit Service e75323
#include <pthread.h>
Packit Service e75323
#include <support/xthread.h>
Packit Service e75323
#include <errno.h>
Packit Service e75323
Packit Service e75323
/* We need only one lock to reproduce the issue. We will need multiple
Packit Service e75323
   threads to get the exact case where we have a read, try, and unlock
Packit Service e75323
   all interleaving to produce the case where the readers are waiting
Packit Service e75323
   and the try fails to wake them.  */
Packit Service e75323
pthread_rwlock_t onelock;
Packit Service e75323
Packit Service e75323
/* The number of threads is arbitrary but empirically chosen to have
Packit Service e75323
   enough threads that we see the condition where waiting readers are
Packit Service e75323
   not woken by a successful tryrdlock.  */
Packit Service e75323
#define NTHREADS 32
Packit Service e75323
Packit Service e75323
/* Shutdown flag: do_test stores 1 here once the run time has elapsed,
   and every run_loop thread polls it as its loop condition.  It is
   _Atomic because it is written by one thread and read by the
   others.  */
_Atomic int do_exit;
Packit Service e75323
Packit Service e75323
void *
Packit Service e75323
run_loop (void *arg)
Packit Service e75323
{
Packit Service e75323
  int i = 0, ret;
Packit Service e75323
  while (!do_exit)
Packit Service e75323
    {
Packit Service e75323
      /* Arbitrarily choose if we are the writer or reader.  Choose a
Packit Service e75323
	 high enough ratio of readers to writers to make it likely
Packit Service e75323
	 that readers block (and eventually are susceptable to
Packit Service e75323
	 stalling).
Packit Service e75323
Packit Service e75323
         If we are a writer, take the write lock, and then unlock.
Packit Service e75323
	 If we are a reader, try the lock, then lock, then unlock.  */
Packit Service e75323
      if ((i % 8) != 0)
Packit Service e75323
	xpthread_rwlock_wrlock (&onelock);
Packit Service e75323
      else
Packit Service e75323
	{
Packit Service e75323
	  if ((ret = pthread_rwlock_tryrdlock (&onelock)) != 0)
Packit Service e75323
	    {
Packit Service e75323
	      if (ret == EBUSY)
Packit Service e75323
		xpthread_rwlock_rdlock (&onelock);
Packit Service e75323
	      else
Packit Service e75323
		exit (EXIT_FAILURE);
Packit Service e75323
	    }
Packit Service e75323
	}
Packit Service e75323
      /* Thread does some work and then unlocks.  */
Packit Service e75323
      xpthread_rwlock_unlock (&onelock);
Packit Service e75323
      i++;
Packit Service e75323
    }
Packit Service e75323
  return NULL;
Packit Service e75323
}
Packit Service e75323
Packit Service e75323
int
Packit Service e75323
do_test (void)
Packit Service e75323
{
Packit Service e75323
  int i;
Packit Service e75323
  pthread_t tids[NTHREADS];
Packit Service e75323
  xpthread_rwlock_init (&onelock, NULL);
Packit Service e75323
  for (i = 0; i < NTHREADS; i++)
Packit Service e75323
    tids[i] = xpthread_create (NULL, run_loop, NULL);
Packit Service e75323
  /* Run for some amount of time.  Empirically speaking exercising
Packit Service e75323
     the stall via pthread_rwlock_tryrdlock is much harder, and on
Packit Service e75323
     a 3.5GHz 4 core x86_64 VM system it takes somewhere around
Packit Service e75323
     20-200s to stall, approaching 100% stall past 200s.  We can't
Packit Service e75323
     wait that long for a regression test so we just test for 20s,
Packit Service e75323
     and expect the stall to happen with a 5-10% chance (enough for
Packit Service e75323
     developers to see).  */
Packit Service e75323
  sleep (20);
Packit Service e75323
  /* Then exit.  */
Packit Service e75323
  printf ("INFO: Exiting...\n");
Packit Service e75323
  do_exit = 1;
Packit Service e75323
  /* If any readers stalled then we will timeout waiting for them.  */
Packit Service e75323
  for (i = 0; i < NTHREADS; i++)
Packit Service e75323
    xpthread_join (tids[i]);
Packit Service e75323
  printf ("INFO: Done.\n");
Packit Service e75323
  xpthread_rwlock_destroy (&onelock);
Packit Service e75323
  printf ("PASS: No pthread_rwlock_tryrdlock stalls detected.\n");
Packit Service e75323
  return 0;
Packit Service e75323
}
Packit Service e75323
Packit Service e75323
/* do_test sleeps for 20 seconds before joining its threads.
   NOTE(review): presumably TIMEOUT is the test driver's limit in
   seconds, leaving headroom so that a stalled join is reported as a
   timeout -- confirm against support/test-driver.c.  */
#define TIMEOUT 30
Packit Service e75323
#include <support/test-driver.c>