static void io_queue_sqe(struct io_kiocb *req);
static void io_move_task_work_from_local(struct io_ring_ctx *ctx);
static void __io_submit_flush_completions(struct io_ring_ctx *ctx);
-static __cold void io_fallback_tw(struct io_uring_task *tctx);
struct kmem_cache *req_cachep;
return cmpxchg(&head->first, old, new);
}
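+/*
+ * Punt all pending task_work on this tctx to each request's per-ctx
+ * fallback_work. With @sync set, also flush that work before returning,
+ * holding a ctx reference across the flush so the ring stays alive.
+ */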
+static __cold void io_fallback_tw(struct io_uring_task *tctx, bool sync)
+{
+ struct llist_node *node = llist_del_all(&tctx->task_list);
+ struct io_ring_ctx *last_ctx = NULL;
+ struct io_kiocb *req;
+
+ while (node) {
+ req = container_of(node, struct io_kiocb, io_task_work.node);
+ node = node->next;
+ if (sync && last_ctx != req->ctx) {
+ if (last_ctx) {
+ flush_delayed_work(&last_ctx->fallback_work);
+ percpu_ref_put(&last_ctx->refs);
+ }
+ last_ctx = req->ctx;
+ percpu_ref_get(&last_ctx->refs);
+ }
+ if (llist_add(&req->io_task_work.node,
+ &req->ctx->fallback_llist))
+ schedule_delayed_work(&req->ctx->fallback_work, 1);
+ }
+
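+ /* if syncing, flush the final ring's fallback work and drop its ref */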
+ if (last_ctx) {
+ flush_delayed_work(&last_ctx->fallback_work);
+ percpu_ref_put(&last_ctx->refs);
+ }
+}
+
void tctx_task_work(struct callback_head *cb)
{
struct io_tw_state ts = {};
unsigned int count = 0;
if (unlikely(current->flags & PF_EXITING)) {
- io_fallback_tw(tctx);
+ io_fallback_tw(tctx, true);
return;
}
trace_io_uring_task_work_run(tctx, count, loops);
}
-static __cold void io_fallback_tw(struct io_uring_task *tctx)
-{
- struct llist_node *node = llist_del_all(&tctx->task_list);
- struct io_kiocb *req;
-
- while (node) {
- req = container_of(node, struct io_kiocb, io_task_work.node);
- node = node->next;
- if (llist_add(&req->io_task_work.node,
- &req->ctx->fallback_llist))
- schedule_delayed_work(&req->ctx->fallback_work, 1);
- }
-}
-
static inline void io_req_local_work_add(struct io_kiocb *req, unsigned flags)
{
struct io_ring_ctx *ctx = req->ctx;
if (likely(!task_work_add(req->task, &tctx->task_work, ctx->notify_method)))
return;
- io_fallback_tw(tctx);
+ io_fallback_tw(tctx, false);
}
void __io_req_task_work_add(struct io_kiocb *req, unsigned flags)
static inline int io_cqring_wait_schedule(struct io_ring_ctx *ctx,
struct io_wait_queue *iowq)
{
+ int token, ret;
+
if (unlikely(READ_ONCE(ctx->check_cq)))
return 1;
if (unlikely(!llist_empty(&ctx->work_llist)))
return 1;
if (unlikely(task_sigpending(current)))
return -EINTR;
if (unlikely(io_should_wake(iowq)))
return 0;
+
+ /*
+ * Use io_schedule_prepare/finish, so cpufreq can take into account
+ * that the task is waiting for IO - turns out to be important for low
+ * QD IO.
+ */
+ token = io_schedule_prepare();
+ ret = 0;
if (iowq->timeout == KTIME_MAX)
schedule();
else if (!schedule_hrtimeout(&iowq->timeout, HRTIMER_MODE_ABS))
- return -ETIME;
- return 0;
+ ret = -ETIME;
+ io_schedule_finish(token);
+ return ret;
}
/*
if (ctx->rings)
io_kill_timeouts(ctx, NULL, true);
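+ /* wait for any queued fallback task_work to finish before queueing exit work */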
+ flush_delayed_work(&ctx->fallback_work);
+
INIT_WORK(&ctx->exit_work, io_ring_exit_work);
/*
* Use system_unbound_wq to avoid spawning tons of event kworkers