Source-Changes-HG archive

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]

[src/trunk]: src/lib/libpthread Another bug. The CAS loop in pthread_cond_si...



details:   https://anonhg.NetBSD.org/src/rev/5d2545e323a9
branches:  trunk
changeset: 1011001:5d2545e323a9
user:      ad <ad%NetBSD.org@localhost>
date:      Sun Jun 14 21:33:28 2020 +0000

description:
Another bug.  The CAS loop in pthread_cond_signal() could race against the
thread it is trying to awake.  The thread could exit the condvar and then
reinsert itself at the head of the list with a new waiter behind it.  It's
likely possible to fix this in a way that's wait-free but for now just fix
the bug.

diffstat:

 lib/libpthread/pthread_cond.c |  95 ++++++++++++++++++++++++++++--------------
 1 files changed, 63 insertions(+), 32 deletions(-)

diffs (211 lines):

diff -r cd88be92e1db -r 5d2545e323a9 lib/libpthread/pthread_cond.c
--- a/lib/libpthread/pthread_cond.c     Sun Jun 14 21:31:11 2020 +0000
+++ b/lib/libpthread/pthread_cond.c     Sun Jun 14 21:33:28 2020 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: pthread_cond.c,v 1.75 2020/06/13 17:39:42 riastradh Exp $      */
+/*     $NetBSD: pthread_cond.c,v 1.76 2020/06/14 21:33:28 ad Exp $     */
 
 /*-
  * Copyright (c) 2001, 2006, 2007, 2008, 2020 The NetBSD Foundation, Inc.
@@ -30,7 +30,7 @@
  */
 
 #include <sys/cdefs.h>
-__RCSID("$NetBSD: pthread_cond.c,v 1.75 2020/06/13 17:39:42 riastradh Exp $");
+__RCSID("$NetBSD: pthread_cond.c,v 1.76 2020/06/14 21:33:28 ad Exp $");
 
 #include <stdlib.h>
 #include <errno.h>
@@ -54,6 +54,13 @@
 __strong_alias(__libc_cond_timedwait,pthread_cond_timedwait)
 __strong_alias(__libc_cond_destroy,pthread_cond_destroy)
 
+/*
+ * A dummy waiter that's used to flag that pthread_cond_signal() is in
+ * progress and nobody else should try to modify the waiter list until
+ * it completes.
+ */
+static struct pthread__waiter pthread__cond_dummy;
+
 static clockid_t
 pthread_cond_getclock(const pthread_cond_t *cond)
 {
@@ -111,7 +118,7 @@
 pthread_cond_timedwait(pthread_cond_t *cond, pthread_mutex_t *mutex,
                       const struct timespec *abstime)
 {
-       struct pthread__waiter waiter, *next, *waiters;
+       struct pthread__waiter waiter, *next, *head;
        pthread_t self;
        int error, cancel;
        clockid_t clkid = pthread_cond_getclock(cond);
@@ -135,33 +142,39 @@
 
        /* Note this thread as waiting on the CV. */
        cond->ptc_mutex = mutex;
-       for (waiters = cond->ptc_waiters;; waiters = next) {
+       for (head = cond->ptc_waiters;; head = next) {
+               /* Wait while pthread_cond_signal() in progress. */
+               if (__predict_false(head == &pthread__cond_dummy)) {
+                       sched_yield();
+                       next = cond->ptc_waiters;
+                       continue;
+               }
                waiter.lid = self->pt_lid;
-               waiter.next = waiters;
+               waiter.next = head;
 #ifndef PTHREAD__ATOMIC_IS_MEMBAR
                membar_producer();
 #endif
-               next = atomic_cas_ptr(&cond->ptc_waiters, waiters, &waiter);
-               if (__predict_true(next == waiters)) {
+               next = atomic_cas_ptr(&cond->ptc_waiters, head, &waiter);
+               if (__predict_true(next == head)) {
                        break;
                }
        }
 
-       /* Drop the interlock */
+       /* Drop the interlock and wait. */
+       error = 0;
        pthread_mutex_unlock(mutex);
-       error = 0;
-
        while (waiter.lid && !(cancel = self->pt_cancel)) {
                int rv = _lwp_park(clkid, TIMER_ABSTIME, __UNCONST(abstime),
                    0, NULL, NULL);
                if (rv == 0) {
                        continue;
                }
-               if (errno != EINTR && errno != EALREADY && errno != ESRCH) {
+               if (errno != EINTR && errno != EALREADY) {
                        error = errno;
                        break;
                }
        }
+       pthread_mutex_lock(mutex);
 
        /*
         * If this thread absorbed a wakeup from pthread_cond_signal() and
@@ -169,11 +182,6 @@
         *
         * And if awoken early, we may still be on the waiter list and must
         * remove self.
-        *
-        * In all cases do the wakeup without the mutex held otherwise:
-        *
-        * - wakeup could be deferred until mutex release
-        * - it would be mixing up two sets of waitpoints
         */
        if (__predict_false(cancel | error)) {
                pthread_cond_broadcast(cond);
@@ -183,10 +191,12 @@
                 * Wait until released, otherwise "waiter" is still globally
                 * visible.
                 */
+               pthread_mutex_unlock(mutex);
                while (__predict_false(waiter.lid)) {
                        (void)_lwp_park(CLOCK_MONOTONIC, 0, NULL, 0, NULL,
                            NULL);
                }
+               pthread_mutex_lock(mutex);
        } else {
                pthread__assert(!waiter.lid);
        }
@@ -195,7 +205,6 @@
         * If cancelled then exit.  POSIX dictates that the mutex must be
         * held if this happens.
         */
-       pthread_mutex_lock(mutex);
        if (cancel) {
                pthread__cancelled();
        }
@@ -215,7 +224,7 @@
 int
 pthread_cond_signal(pthread_cond_t *cond)
 {
-       struct pthread__waiter *waiter, *next;
+       struct pthread__waiter *head, *next;
        pthread_mutex_t *mutex;
        pthread_t self;
 
@@ -228,28 +237,39 @@
        /* Take ownership of one waiter. */
        self = pthread_self();
        mutex = cond->ptc_mutex;
-       for (waiter = cond->ptc_waiters;; waiter = next) {
-               if (waiter == NULL) {
+       for (head = cond->ptc_waiters;; head = next) {
+               /* Wait while pthread_cond_signal() in progress. */
+               if (__predict_false(head == &pthread__cond_dummy)) {
+                       sched_yield();
+                       next = cond->ptc_waiters;
+                       continue;
+               }
+               if (head == NULL) {
                        return 0;
                }
-               membar_datadep_consumer(); /* for alpha */
-               next = waiter->next;
-               next = atomic_cas_ptr(&cond->ptc_waiters, waiter, next);
-               if (__predict_true(next == waiter)) {
+               /* Block concurrent access to the waiter list. */
+               next = atomic_cas_ptr(&cond->ptc_waiters, head,
+                   &pthread__cond_dummy);
+               if (__predict_true(next == head)) {
                        break;
                }
        }
 
+       /* Now that list is locked, read pointer to next and then unlock. */
+       membar_enter();
+       cond->ptc_waiters = head->next;
+       membar_producer();
+       head->next = NULL;
+
        /* Now transfer waiter to the mutex. */
-       waiter->next = NULL;
-       pthread__mutex_deferwake(self, mutex, waiter);
+       pthread__mutex_deferwake(self, mutex, head);
        return 0;
 }
 
 int
 pthread_cond_broadcast(pthread_cond_t *cond)
 {
-       struct pthread__waiter *head;
+       struct pthread__waiter *head, *next;
        pthread_mutex_t *mutex;
        pthread_t self;
 
@@ -262,14 +282,25 @@
        if (cond->ptc_waiters == NULL)
                return 0;
 
-       /* Take ownership of the current set of waiters. */
+       /* Take ownership of current set of waiters. */
        self = pthread_self();
        mutex = cond->ptc_mutex;
-       head = atomic_swap_ptr(&cond->ptc_waiters, NULL);
-       if (head == NULL) {
-               return 0;
+       for (head = cond->ptc_waiters;; head = next) {
+               /* Wait while pthread_cond_signal() in progress. */
+               if (__predict_false(head == &pthread__cond_dummy)) {
+                       sched_yield();
+                       next = cond->ptc_waiters;
+                       continue;
+               }
+               if (head == NULL) {
+                       return 0;
+               }
+               next = atomic_cas_ptr(&cond->ptc_waiters, head, NULL);
+               if (__predict_true(next == head)) {
+                       break;
+               }
        }
-       membar_datadep_consumer(); /* for alpha */
+       membar_enter();
 
        /* Now transfer waiters to the mutex. */
        pthread__mutex_deferwake(self, mutex, head);



Home | Main Index | Thread Index | Old Index