io_uring: pass in EPOLL_URING_WAKE for eventfd signaling and wakeups

author Jens Axboe <axboe@kernel.dk>

Sun, 20 Nov 2022 17:18:45 +0000 (10:18 -0700)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Wed, 4 Jan 2023 10:28:48 +0000 (11:28 +0100)
author Jens Axboe <axboe@kernel.dk>
Sun, 20 Nov 2022 17:18:45 +0000 (10:18 -0700)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Wed, 4 Jan 2023 10:28:48 +0000 (11:28 +0100)
diff --git a/io_uring/io_uring.c b/io_uring/io_uring.c

index 17771cb..71f1cab 100644 (file)
--- a/io_uring/io_uring.c
+++ b/io_uring/io_uring.c
@@ -495,7 +495,7 @@ static void io_eventfd_ops(struct rcu_head *rcu)
         int ops = atomic_xchg(&ev_fd->ops, 0);
  
         if (ops & BIT(IO_EVENTFD_OP_SIGNAL_BIT))
-               eventfd_signal(ev_fd->cq_ev_fd, 1);
+               eventfd_signal_mask(ev_fd->cq_ev_fd, 1, EPOLL_URING_WAKE);
  
         /* IO_EVENTFD_OP_FREE_BIT may not be set here depending on callback
          * ordering in a race but if references are 0 we know we have to free
@@ -531,7 +531,7 @@ static void io_eventfd_signal(struct io_ring_ctx *ctx)
                 goto out;
  
         if (likely(eventfd_signal_allowed())) {
-               eventfd_signal(ev_fd->cq_ev_fd, 1);
+               eventfd_signal_mask(ev_fd->cq_ev_fd, 1, EPOLL_URING_WAKE);
         } else {
                 atomic_inc(&ev_fd->refs);
                 if (!atomic_fetch_or(BIT(IO_EVENTFD_OP_SIGNAL_BIT), &ev_fd->ops))
diff --git a/io_uring/io_uring.h b/io_uring/io_uring.h

index 50bc3af..4334cd3 100644 (file)
--- a/io_uring/io_uring.h
+++ b/io_uring/io_uring.h
@@ -4,6 +4,7 @@
  #include <linux/errno.h>
  #include <linux/lockdep.h>
  #include <linux/io_uring_types.h>
+#include <uapi/linux/eventpoll.h>
  #include "io-wq.h"
  #include "slist.h"
  #include "filetable.h"
@@ -207,12 +208,18 @@ static inline void io_commit_cqring(struct io_ring_ctx *ctx)
  static inline void __io_cqring_wake(struct io_ring_ctx *ctx)
  {
         /*
-        * wake_up_all() may seem excessive, but io_wake_function() and
-        * io_should_wake() handle the termination of the loop and only
-        * wake as many waiters as we need to.
+        * Trigger waitqueue handler on all waiters on our waitqueue. This
+        * won't necessarily wake up all the tasks, io_should_wake() will make
+        * that decision.
+        *
+        * Pass in EPOLLIN|EPOLL_URING_WAKE as the poll wakeup key. The latter
+        * is set in the mask so that if we recurse back into our own poll
+        * waitqueue handlers, we know we have a dependency between eventfd or
+        * epoll and should terminate multishot poll at that point.
          */
         if (waitqueue_active(&ctx->cq_wait))
-               wake_up_all(&ctx->cq_wait);
+               __wake_up(&ctx->cq_wait, TASK_NORMAL, 0,
+                               poll_to_key(EPOLL_URING_WAKE | EPOLLIN));
  }
  
  static inline void io_cqring_wake(struct io_ring_ctx *ctx)
diff --git a/io_uring/poll.c b/io_uring/poll.c

index d9bf176..fded144 100644 (file)
--- a/io_uring/poll.c
+++ b/io_uring/poll.c
@@ -429,6 +429,14 @@ static int io_poll_wake(struct wait_queue_entry *wait, unsigned mode, int sync,
                 return 0;
  
         if (io_poll_get_ownership(req)) {
+               /*
+                * If we trigger a multishot poll off our own wakeup path,
+                * disable multishot as there is a circular dependency between
+                * CQ posting and triggering the event.
+                */
+               if (mask & EPOLL_URING_WAKE)
+                       poll->events |= EPOLLONESHOT;
+
                 /* optional, saves extra locking for removal in tw handler */
                 if (mask && poll->events & EPOLLONESHOT) {
                         list_del_init(&poll->wait.entry);
author	Jens Axboe <axboe@kernel.dk>
	Sun, 20 Nov 2022 17:18:45 +0000 (10:18 -0700)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Wed, 4 Jan 2023 10:28:48 +0000 (11:28 +0100)
io_uring/io_uring.c		patch | blob | history
io_uring/io_uring.h		patch | blob | history
io_uring/poll.c		patch | blob | history