io_uring/poll: don't enable lazy wake for POLLEXCLUSIVE

author Jens Axboe <axboe@kernel.dk>

Wed, 13 Dec 2023 15:58:15 +0000 (08:58 -0700)

committer Jens Axboe <axboe@kernel.dk>

Wed, 13 Dec 2023 15:58:15 +0000 (08:58 -0700)
author Jens Axboe <axboe@kernel.dk>
Wed, 13 Dec 2023 15:58:15 +0000 (08:58 -0700)
committer Jens Axboe <axboe@kernel.dk>
Wed, 13 Dec 2023 15:58:15 +0000 (08:58 -0700)
diff --git a/include/linux/io_uring_types.h b/include/linux/io_uring_types.h

index 805bb635cdf55805171c20f66312663a6d84fe8e..239a4f68801bb59812c33b80d88958065bf124a3 100644 (file)
--- a/include/linux/io_uring_types.h
+++ b/include/linux/io_uring_types.h
@@ -434,6 +434,7 @@ enum {
         /* keep async read/write and isreg together and in order */
         REQ_F_SUPPORT_NOWAIT_BIT,
         REQ_F_ISREG_BIT,
+       REQ_F_POLL_NO_LAZY_BIT,
  
         /* not a real bit, just to check we're not overflowing the space */
         __REQ_F_LAST_BIT,
@@ -501,6 +502,8 @@ enum {
         REQ_F_CLEAR_POLLIN      = BIT(REQ_F_CLEAR_POLLIN_BIT),
         /* hashed into ->cancel_hash_locked, protected by ->uring_lock */
         REQ_F_HASH_LOCKED       = BIT(REQ_F_HASH_LOCKED_BIT),
+       /* don't use lazy poll wake for this request */
+       REQ_F_POLL_NO_LAZY      = BIT(REQ_F_POLL_NO_LAZY_BIT),
  };
  
  typedef void (*io_req_tw_func_t)(struct io_kiocb *req, struct io_tw_state *ts);
diff --git a/io_uring/poll.c b/io_uring/poll.c

index d38d05edb4fa26c92f46b48bc89d0aa280c568ab..d59b74a99d4e4b444dcb2f86dc9d3594d838e1cf 100644 (file)
--- a/io_uring/poll.c
+++ b/io_uring/poll.c
@@ -366,11 +366,16 @@ void io_poll_task_func(struct io_kiocb *req, struct io_tw_state *ts)
  
  static void __io_poll_execute(struct io_kiocb *req, int mask)
  {
+       unsigned flags = 0;
+
         io_req_set_res(req, mask, 0);
         req->io_task_work.func = io_poll_task_func;
  
         trace_io_uring_task_add(req, mask);
-       __io_req_task_work_add(req, IOU_F_TWQ_LAZY_WAKE);
+
+       if (!(req->flags & REQ_F_POLL_NO_LAZY))
+               flags = IOU_F_TWQ_LAZY_WAKE;
+       __io_req_task_work_add(req, flags);
  }
  
  static inline void io_poll_execute(struct io_kiocb *req, int res)
@@ -526,10 +531,19 @@ static void __io_queue_proc(struct io_poll *poll, struct io_poll_table *pt,
         poll->head = head;
         poll->wait.private = (void *) wqe_private;
  
-       if (poll->events & EPOLLEXCLUSIVE)
+       if (poll->events & EPOLLEXCLUSIVE) {
+               /*
+                * Exclusive waits may only wake a limited amount of entries
+                * rather than all of them, this may interfere with lazy
+                * wake if someone does wait(events > 1). Ensure we don't do
+                * lazy wake for those, as we need to process each one as they
+                * come in.
+                */
+               req->flags |= REQ_F_POLL_NO_LAZY;
                 add_wait_queue_exclusive(head, &poll->wait);
-       else
+       } else {
                 add_wait_queue(head, &poll->wait);
+       }
  }
  
  static void io_poll_queue_proc(struct file *file, struct wait_queue_head *head,
author	Jens Axboe <axboe@kernel.dk>
	Wed, 13 Dec 2023 15:58:15 +0000 (08:58 -0700)
committer	Jens Axboe <axboe@kernel.dk>
	Wed, 13 Dec 2023 15:58:15 +0000 (08:58 -0700)
include/linux/io_uring_types.h		patch | blob | history
io_uring/poll.c		patch | blob | history