io-wq: check max_worker limits if a worker transitions bound state

author Jens Axboe <axboe@kernel.dk>

Sun, 29 Aug 2021 22:13:03 +0000 (16:13 -0600)

committer Jens Axboe <axboe@kernel.dk>

Mon, 30 Aug 2021 13:28:19 +0000 (07:28 -0600)
author Jens Axboe <axboe@kernel.dk>
Sun, 29 Aug 2021 22:13:03 +0000 (16:13 -0600)
committer Jens Axboe <axboe@kernel.dk>
Mon, 30 Aug 2021 13:28:19 +0000 (07:28 -0600)
diff --git a/fs/io-wq.c b/fs/io-wq.c

index 4b5fc621ab397a0db64b2e30d0b3896bf33abbb8..da3ad45028f9dede09b89903418a7a861fbf6529 100644 (file)
--- a/fs/io-wq.c
+++ b/fs/io-wq.c
@@ -424,7 +424,28 @@ static void io_wait_on_hash(struct io_wqe *wqe, unsigned int hash)
         spin_unlock(&wq->hash->wait.lock);
  }
  
-static struct io_wq_work *io_get_next_work(struct io_wqe *wqe)
+/*
+ * Return true if @worker may run @work: always when both are bound or both
+ * unbound (flag polarity is opposite, so '!=' of the negations means "same"),
+ * else only while the acct for @work has nr_workers below max_workers.
+ */
+static bool io_worker_can_run_work(struct io_worker *worker,
+                                  struct io_wq_work *work)
+{
+       struct io_wqe_acct *acct;
+
+       if (!(worker->flags & IO_WORKER_F_BOUND) !=
+           !(work->flags & IO_WQ_WORK_UNBOUND))
+               return true;
+
+       /* types differ: allowed only if the work's acct is under its limit */
+       acct = io_work_get_acct(worker->wqe, work);
+       return acct->nr_workers < acct->max_workers;
+}
+
+static struct io_wq_work *io_get_next_work(struct io_wqe *wqe,
+                                          struct io_worker *worker,
+                                          bool *stalled)
         __must_hold(wqe->lock)
  {
         struct io_wq_work_node *node, *prev;
@@ -436,6 +457,9 @@ static struct io_wq_work *io_get_next_work(struct io_wqe *wqe)
  
                 work = container_of(node, struct io_wq_work, list);
  
+               if (!io_worker_can_run_work(worker, work))
+                       break;
+
                 /* not hashed, can run anytime */
                 if (!io_wq_is_hashed(work)) {
                         wq_list_del(&wqe->work_list, node, prev);
@@ -462,6 +486,7 @@ static struct io_wq_work *io_get_next_work(struct io_wqe *wqe)
                 raw_spin_unlock(&wqe->lock);
                 io_wait_on_hash(wqe, stall_hash);
                 raw_spin_lock(&wqe->lock);
+               *stalled = true;
         }
  
         return NULL;
@@ -501,6 +526,7 @@ static void io_worker_handle_work(struct io_worker *worker)
  
         do {
                 struct io_wq_work *work;
+               bool stalled;
  get_next:
                 /*
                  * If we got some work, mark us as busy. If we didn't, but
@@ -509,10 +535,11 @@ get_next:
                  * can't make progress, any work completion or insertion will
                  * clear the stalled flag.
                  */
-               work = io_get_next_work(wqe);
+               stalled = false;
+               work = io_get_next_work(wqe, worker, &stalled);
                 if (work)
                         __io_worker_busy(wqe, worker, work);
-               else if (!wq_list_empty(&wqe->work_list))
+               else if (stalled)
                         wqe->flags |= IO_WQE_FLAG_STALLED;
  
                 raw_spin_unlock_irq(&wqe->lock);
author	Jens Axboe <axboe@kernel.dk>
	Sun, 29 Aug 2021 22:13:03 +0000 (16:13 -0600)
committer	Jens Axboe <axboe@kernel.dk>
	Mon, 30 Aug 2021 13:28:19 +0000 (07:28 -0600)