Source-Changes-HG archive
[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]
[src/netbsd-9]: src/sys/kern Pullup the following (requested by jdolecek in t...
details: https://anonhg.NetBSD.org/src/rev/4a0fa1406b90
branches: netbsd-9
changeset: 1002143:4a0fa1406b90
user: martin <martin%NetBSD.org@localhost>
date: Thu Feb 04 16:57:25 2021 +0000
description:
Pullup the following (requested by jdolecek in ticket #1191):
sys/kern/kern_event.c r1.110-1.115 (via patch)
fix a race in kqueue_scan() - when multiple threads check the same
kqueue, it could happen other thread seen empty kqueue while kevent
was being checked for re-firing and re-queued
make sure to keep retrying if there are outstanding kevents even
if no kevent is found on first pass through the queue, and only
kq_count when actually completely done with the kevent
PR kern/50094 by Christof Meerwal
Also fixes timer latency in Go, as reported in
https://github.com/golang/go/issues/42515 by Michael Pratt
diffstat:
sys/kern/kern_event.c | 245 +++++++++++++++++++++++++++----------------------
1 files changed, 133 insertions(+), 112 deletions(-)
diffs (truncated from 304 to 300 lines):
diff -r 0947e19b24a1 -r 4a0fa1406b90 sys/kern/kern_event.c
--- a/sys/kern/kern_event.c Fri Jan 29 21:01:53 2021 +0000
+++ b/sys/kern/kern_event.c Thu Feb 04 16:57:25 2021 +0000
@@ -1,4 +1,4 @@
-/* $NetBSD: kern_event.c,v 1.104 2018/11/13 06:58:14 maxv Exp $ */
+/* $NetBSD: kern_event.c,v 1.104.4.1 2021/02/04 16:57:25 martin Exp $ */
/*-
* Copyright (c) 2008, 2009 The NetBSD Foundation, Inc.
@@ -58,7 +58,7 @@
*/
#include <sys/cdefs.h>
-__KERNEL_RCSID(0, "$NetBSD: kern_event.c,v 1.104 2018/11/13 06:58:14 maxv Exp $");
+__KERNEL_RCSID(0, "$NetBSD: kern_event.c,v 1.104.4.1 2021/02/04 16:57:25 martin Exp $");
#include <sys/param.h>
#include <sys/systm.h>
@@ -166,6 +166,8 @@
extern const struct filterops sig_filtops;
+#define KQ_FLUX_WAKEUP(kq) cv_broadcast(&kq->kq_cv)
+
/*
* Table for for all system-defined filters.
* These should be listed in the numeric order of the EVFILT_* defines.
@@ -1226,7 +1228,10 @@
}
count++;
if (count > kq->kq_count) {
- goto bad;
+ panic("%s,%zu: kq=%p kq->kq_count(%d) != "
+ "count(%d), nmarker=%d",
+ func, line, kq, kq->kq_count, count,
+ nmarker);
}
} else {
nmarker++;
@@ -1240,11 +1245,6 @@
#endif
}
}
- if (kq->kq_count != count) {
-bad:
- panic("%s,%zu: kq=%p kq->kq_count(%d) != count(%d), nmarker=%d",
- func, line, kq, kq->kq_count, count, nmarker);
- }
}
#define kq_check(a) kqueue_check(__func__, __LINE__, (a))
#else /* defined(DEBUG) */
@@ -1268,7 +1268,7 @@
struct timespec ats, sleepts;
struct knote *kn, *marker, morker;
size_t count, nkev, nevents;
- int timeout, error, rv;
+ int timeout, error, rv, influx;
filedesc_t *fdp;
fdp = curlwp->l_fd;
@@ -1317,119 +1317,140 @@
}
}
mutex_spin_exit(&kq->kq_lock);
- } else {
- /* mark end of knote list */
- TAILQ_INSERT_TAIL(&kq->kq_head, marker, kn_tqe);
+ goto done;
+ }
+
+ /* mark end of knote list */
+ TAILQ_INSERT_TAIL(&kq->kq_head, marker, kn_tqe);
+ influx = 0;
- /*
- * Acquire the fdp->fd_lock interlock to avoid races with
- * file creation/destruction from other threads.
- */
- mutex_spin_exit(&kq->kq_lock);
- mutex_enter(&fdp->fd_lock);
- mutex_spin_enter(&kq->kq_lock);
+ /*
+ * Acquire the fdp->fd_lock interlock to avoid races with
+ * file creation/destruction from other threads.
+ */
+relock:
+ mutex_spin_exit(&kq->kq_lock);
+ mutex_enter(&fdp->fd_lock);
+ mutex_spin_enter(&kq->kq_lock);
+
+ while (count != 0) {
+ kn = TAILQ_FIRST(&kq->kq_head); /* get next knote */
+
+ if ((kn->kn_status & KN_MARKER) != 0 && kn != marker) {
+ if (influx) {
+ influx = 0;
+ KQ_FLUX_WAKEUP(kq);
+ }
+ mutex_exit(&fdp->fd_lock);
+ (void)cv_wait(&kq->kq_cv, &kq->kq_lock);
+ goto relock;
+ }
- while (count != 0) {
- kn = TAILQ_FIRST(&kq->kq_head); /* get next knote */
- while ((kn->kn_status & KN_MARKER) != 0) {
- if (kn == marker) {
- /* it's our marker, stop */
- TAILQ_REMOVE(&kq->kq_head, kn, kn_tqe);
- if (count < maxevents || (tsp != NULL &&
- (timeout = gettimeleft(&ats,
- &sleepts)) <= 0))
- goto done;
- mutex_exit(&fdp->fd_lock);
- goto retry;
- }
- /* someone else's marker. */
- kn = TAILQ_NEXT(kn, kn_tqe);
+ TAILQ_REMOVE(&kq->kq_head, kn, kn_tqe);
+ if (kn == marker) {
+ /* it's our marker, stop */
+ KQ_FLUX_WAKEUP(kq);
+ if (count == maxevents) {
+ mutex_exit(&fdp->fd_lock);
+ goto retry;
}
- kq_check(kq);
+ break;
+ }
+ KASSERT((kn->kn_status & KN_BUSY) == 0);
+
+ kq_check(kq);
+ kn->kn_status &= ~KN_QUEUED;
+ kn->kn_status |= KN_BUSY;
+ kq_check(kq);
+ if (kn->kn_status & KN_DISABLED) {
+ kn->kn_status &= ~KN_BUSY;
kq->kq_count--;
- TAILQ_REMOVE(&kq->kq_head, kn, kn_tqe);
- kn->kn_status &= ~KN_QUEUED;
- kn->kn_status |= KN_BUSY;
- kq_check(kq);
- if (kn->kn_status & KN_DISABLED) {
+ /* don't want disabled events */
+ continue;
+ }
+ if ((kn->kn_flags & EV_ONESHOT) == 0) {
+ mutex_spin_exit(&kq->kq_lock);
+ KASSERT(kn->kn_fop != NULL);
+ KASSERT(kn->kn_fop->f_event != NULL);
+ KERNEL_LOCK(1, NULL); /* XXXSMP */
+ KASSERT(mutex_owned(&fdp->fd_lock));
+ rv = (*kn->kn_fop->f_event)(kn, 0);
+ KERNEL_UNLOCK_ONE(NULL); /* XXXSMP */
+ mutex_spin_enter(&kq->kq_lock);
+ /* Re-poll if note was re-enqueued. */
+ if ((kn->kn_status & KN_QUEUED) != 0) {
kn->kn_status &= ~KN_BUSY;
- /* don't want disabled events */
+ /* Re-enqueue raised kq_count, lower it again */
+ kq->kq_count--;
+ influx = 1;
continue;
}
- if ((kn->kn_flags & EV_ONESHOT) == 0) {
- mutex_spin_exit(&kq->kq_lock);
- KASSERT(kn->kn_fop != NULL);
- KASSERT(kn->kn_fop->f_event != NULL);
- KERNEL_LOCK(1, NULL); /* XXXSMP */
- KASSERT(mutex_owned(&fdp->fd_lock));
- rv = (*kn->kn_fop->f_event)(kn, 0);
- KERNEL_UNLOCK_ONE(NULL); /* XXXSMP */
- mutex_spin_enter(&kq->kq_lock);
- /* Re-poll if note was re-enqueued. */
- if ((kn->kn_status & KN_QUEUED) != 0) {
- kn->kn_status &= ~KN_BUSY;
- continue;
- }
- if (rv == 0) {
- /*
- * non-ONESHOT event that hasn't
- * triggered again, so de-queue.
- */
- kn->kn_status &= ~(KN_ACTIVE|KN_BUSY);
- continue;
- }
- }
- /* XXXAD should be got from f_event if !oneshot. */
- *kevp++ = kn->kn_kevent;
- nkev++;
- if (kn->kn_flags & EV_ONESHOT) {
- /* delete ONESHOT events after retrieval */
- kn->kn_status &= ~KN_BUSY;
- mutex_spin_exit(&kq->kq_lock);
- knote_detach(kn, fdp, true);
- mutex_enter(&fdp->fd_lock);
- mutex_spin_enter(&kq->kq_lock);
- } else if (kn->kn_flags & EV_CLEAR) {
- /* clear state after retrieval */
- kn->kn_data = 0;
- kn->kn_fflags = 0;
- kn->kn_status &= ~(KN_QUEUED|KN_ACTIVE|KN_BUSY);
- } else if (kn->kn_flags & EV_DISPATCH) {
- kn->kn_status |= KN_DISABLED;
- kn->kn_status &= ~(KN_QUEUED|KN_ACTIVE|KN_BUSY);
- } else {
- /* add event back on list */
- kq_check(kq);
- kn->kn_status |= KN_QUEUED;
- kn->kn_status &= ~KN_BUSY;
- TAILQ_INSERT_TAIL(&kq->kq_head, kn, kn_tqe);
- kq->kq_count++;
- kq_check(kq);
- }
- if (nkev == kevcnt) {
- /* do copyouts in kevcnt chunks */
- mutex_spin_exit(&kq->kq_lock);
- mutex_exit(&fdp->fd_lock);
- error = (*keops->keo_put_events)
- (keops->keo_private,
- kevbuf, ulistp, nevents, nkev);
- mutex_enter(&fdp->fd_lock);
- mutex_spin_enter(&kq->kq_lock);
- nevents += nkev;
- nkev = 0;
- kevp = kevbuf;
- }
- count--;
- if (error != 0 || count == 0) {
- /* remove marker */
- TAILQ_REMOVE(&kq->kq_head, marker, kn_tqe);
- break;
+ if (rv == 0) {
+ /*
+ * non-ONESHOT event that hasn't
+ * triggered again, so de-queue.
+ */
+ kn->kn_status &= ~(KN_ACTIVE|KN_BUSY);
+ kq->kq_count--;
+ influx = 1;
+ continue;
}
}
- done:
- mutex_spin_exit(&kq->kq_lock);
- mutex_exit(&fdp->fd_lock);
+ /* XXXAD should be got from f_event if !oneshot. */
+ *kevp++ = kn->kn_kevent;
+ nkev++;
+ if (kn->kn_flags & EV_ONESHOT) {
+ /* delete ONESHOT events after retrieval */
+ kn->kn_status &= ~KN_BUSY;
+ mutex_spin_exit(&kq->kq_lock);
+ knote_detach(kn, fdp, true);
+ mutex_enter(&fdp->fd_lock);
+ mutex_spin_enter(&kq->kq_lock);
+ } else if (kn->kn_flags & EV_CLEAR) {
+ /* clear state after retrieval */
+ kn->kn_data = 0;
+ kn->kn_fflags = 0;
+ kn->kn_status &= ~(KN_ACTIVE|KN_BUSY);
+ kq->kq_count--;
+ } else if (kn->kn_flags & EV_DISPATCH) {
+ kn->kn_status |= KN_DISABLED;
+ kn->kn_status &= ~(KN_ACTIVE|KN_BUSY);
+ kq->kq_count--;
+ } else {
+ /* add event back on list */
+ kq_check(kq);
+ kn->kn_status |= KN_QUEUED;
+ kn->kn_status &= ~KN_BUSY;
+ TAILQ_INSERT_TAIL(&kq->kq_head, kn, kn_tqe);
+ kq_check(kq);
+ }
+ if (nkev == kevcnt) {
+ /* do copyouts in kevcnt chunks */
+ influx = 0;
+ KQ_FLUX_WAKEUP(kq);
+ mutex_spin_exit(&kq->kq_lock);
+ mutex_exit(&fdp->fd_lock);
+ error = (*keops->keo_put_events)
+ (keops->keo_private,
+ kevbuf, ulistp, nevents, nkev);
+ mutex_enter(&fdp->fd_lock);
+ mutex_spin_enter(&kq->kq_lock);
+ nevents += nkev;
+ nkev = 0;
+ kevp = kevbuf;
+ }
+ count--;
+ if (error != 0 || count == 0) {
+ /* remove marker */
+ TAILQ_REMOVE(&kq->kq_head, marker, kn_tqe);
+ break;
+ }
}
+ KQ_FLUX_WAKEUP(kq);
+ mutex_spin_exit(&kq->kq_lock);
+ mutex_exit(&fdp->fd_lock);
+
Home |
Main Index |
Thread Index |
Old Index