ARM/ARM64: config: enable DM_INIT configuration

[platform/kernel/linux-rpi.git] / fs / io_uring.c
diff --git a/fs/io_uring.c b/fs/io_uring.c

index 10578cd..b8ae64d 100644 (file)
--- a/fs/io_uring.c
+++ b/fs/io_uring.c
@@ -1155,12 +1155,6 @@ static inline bool req_ref_put_and_test(struct io_kiocb *req)
         return atomic_dec_and_test(&req->refs);
  }
  
-static inline void req_ref_put(struct io_kiocb *req)
-{
-       WARN_ON_ONCE(!(req->flags & REQ_F_REFCOUNT));
-       WARN_ON_ONCE(req_ref_put_and_test(req));
-}
-
  static inline void req_ref_get(struct io_kiocb *req)
  {
         WARN_ON_ONCE(!(req->flags & REQ_F_REFCOUNT));
@@ -2707,6 +2701,20 @@ static bool __io_complete_rw_common(struct io_kiocb *req, long res)
         return false;
  }
  
+static inline int io_fixup_rw_res(struct io_kiocb *req, unsigned res)
+{
+       struct io_async_rw *io = req->async_data;
+
+       /* add previously done IO, if any */
+       if (io && io->bytes_done > 0) {
+               if (res < 0)
+                       res = io->bytes_done;
+               else
+                       res += io->bytes_done;
+       }
+       return res;
+}
+
  static void io_req_task_complete(struct io_kiocb *req, bool *locked)
  {
         unsigned int cflags = io_put_rw_kbuf(req);
@@ -2730,7 +2738,7 @@ static void __io_complete_rw(struct io_kiocb *req, long res, long res2,
  {
         if (__io_complete_rw_common(req, res))
                 return;
-       __io_req_complete(req, issue_flags, req->result, io_put_rw_kbuf(req));
+       __io_req_complete(req, issue_flags, io_fixup_rw_res(req, res), io_put_rw_kbuf(req));
  }
  
  static void io_complete_rw(struct kiocb *kiocb, long res, long res2)
@@ -2739,7 +2747,7 @@ static void io_complete_rw(struct kiocb *kiocb, long res, long res2)
  
         if (__io_complete_rw_common(req, res))
                 return;
-       req->result = res;
+       req->result = io_fixup_rw_res(req, res);
         req->io_task_work.func = io_req_task_complete;
         io_req_task_work_add(req);
  }
@@ -2985,15 +2993,6 @@ static void kiocb_done(struct kiocb *kiocb, ssize_t ret,
                        unsigned int issue_flags)
  {
         struct io_kiocb *req = container_of(kiocb, struct io_kiocb, rw.kiocb);
-       struct io_async_rw *io = req->async_data;
-
-       /* add previously done IO, if any */
-       if (io && io->bytes_done > 0) {
-               if (ret < 0)
-                       ret = io->bytes_done;
-               else
-                       ret += io->bytes_done;
-       }
  
         if (req->flags & REQ_F_CUR_POS)
                 req->file->f_pos = kiocb->ki_pos;
@@ -3010,6 +3009,7 @@ static void kiocb_done(struct kiocb *kiocb, ssize_t ret,
                         unsigned int cflags = io_put_rw_kbuf(req);
                         struct io_ring_ctx *ctx = req->ctx;
  
+                       ret = io_fixup_rw_res(req, ret);
                         req_set_fail(req);
                         if (!(issue_flags & IO_URING_F_NONBLOCK)) {
                                 mutex_lock(&ctx->uring_lock);
@@ -3606,6 +3606,7 @@ static int io_read(struct io_kiocb *req, unsigned int issue_flags)
                         return -EAGAIN;
                 }
  
+               req->result = iov_iter_count(iter);
                 /*
                  * Now retry read with the IOCB_WAITQ parts set in the iocb. If
                  * we get -EIOCBQUEUED, then we'll get a notification when the
@@ -4768,7 +4769,8 @@ static int io_setup_async_msg(struct io_kiocb *req,
         async_msg = req->async_data;
         req->flags |= REQ_F_NEED_CLEANUP;
         memcpy(async_msg, kmsg, sizeof(*kmsg));
-       async_msg->msg.msg_name = &async_msg->addr;
+       if (async_msg->msg.msg_name)
+               async_msg->msg.msg_name = &async_msg->addr;
         /* if were using fast_iov, set it to the new one */
         if (!async_msg->free_iov)
                 async_msg->msg.msg_iter.iov = async_msg->fast_iov;
@@ -5320,7 +5322,7 @@ struct io_poll_table {
  };
  
  #define IO_POLL_CANCEL_FLAG    BIT(31)
-#define IO_POLL_REF_MASK       ((1u << 20)-1)
+#define IO_POLL_REF_MASK       GENMASK(30, 0)
  
  /*
   * If refs part of ->poll_refs (see IO_POLL_REF_MASK) is 0, it's free. We can
@@ -5375,12 +5377,14 @@ static void io_init_poll_iocb(struct io_poll_iocb *poll, __poll_t events,
  
  static inline void io_poll_remove_entry(struct io_poll_iocb *poll)
  {
-       struct wait_queue_head *head = poll->head;
+       struct wait_queue_head *head = smp_load_acquire(&poll->head);
  
-       spin_lock_irq(&head->lock);
-       list_del_init(&poll->wait.entry);
-       poll->head = NULL;
-       spin_unlock_irq(&head->lock);
+       if (head) {
+               spin_lock_irq(&head->lock);
+               list_del_init(&poll->wait.entry);
+               poll->head = NULL;
+               spin_unlock_irq(&head->lock);
+       }
  }
  
  static void io_poll_remove_entries(struct io_kiocb *req)
@@ -5388,10 +5392,26 @@ static void io_poll_remove_entries(struct io_kiocb *req)
         struct io_poll_iocb *poll = io_poll_get_single(req);
         struct io_poll_iocb *poll_double = io_poll_get_double(req);
  
-       if (poll->head)
-               io_poll_remove_entry(poll);
-       if (poll_double && poll_double->head)
+       /*
+        * While we hold the waitqueue lock and the waitqueue is nonempty,
+        * wake_up_pollfree() will wait for us.  However, taking the waitqueue
+        * lock in the first place can race with the waitqueue being freed.
+        *
+        * We solve this as eventpoll does: by taking advantage of the fact that
+        * all users of wake_up_pollfree() will RCU-delay the actual free.  If
+        * we enter rcu_read_lock() and see that the pointer to the queue is
+        * non-NULL, we can then lock it without the memory being freed out from
+        * under us.
+        *
+        * Keep holding rcu_read_lock() as long as we hold the queue lock, in
+        * case the caller deletes the entry from the queue, leaving it empty.
+        * In that case, only RCU prevents the queue memory from being freed.
+        */
+       rcu_read_lock();
+       io_poll_remove_entry(poll);
+       if (poll_double)
                 io_poll_remove_entry(poll_double);
+       rcu_read_unlock();
  }
  
  /*
@@ -5529,6 +5549,30 @@ static int io_poll_wake(struct wait_queue_entry *wait, unsigned mode, int sync,
                                                  wait);
         __poll_t mask = key_to_poll(key);
  
+       if (unlikely(mask & POLLFREE)) {
+               io_poll_mark_cancelled(req);
+               /* we have to kick tw in case it's not already */
+               io_poll_execute(req, 0);
+
+               /*
+                * If the waitqueue is being freed early but someone is already
+                * holds ownership over it, we have to tear down the request as
+                * best we can. That means immediately removing the request from
+                * its waitqueue and preventing all further accesses to the
+                * waitqueue via the request.
+                */
+               list_del_init(&poll->wait.entry);
+
+               /*
+                * Careful: this *must* be the last step, since as soon
+                * as req->head is NULL'ed out, the request can be
+                * completed and freed, since aio_poll_complete_work()
+                * will no longer need to take the waitqueue lock.
+                */
+               smp_store_release(&poll->head, NULL);
+               return 1;
+       }
+
         /* for instances that support it check for an event match first */
         if (mask && !(mask & poll->events))
                 return 0;
@@ -5633,8 +5677,10 @@ static int __io_arm_poll_handler(struct io_kiocb *req,
  
         if (mask) {
                 /* can't multishot if failed, just queue the event we've got */
-               if (unlikely(ipt->error || !ipt->nr_entries))
+               if (unlikely(ipt->error || !ipt->nr_entries)) {
                         poll->events |= EPOLLONESHOT;
+                       ipt->error = 0;
+               }
                 __io_poll_execute(req, mask);
                 return 0;
         }
@@ -5726,6 +5772,7 @@ static bool io_poll_remove_all(struct io_ring_ctx *ctx, struct task_struct *tsk,
                 list = &ctx->cancel_hash[i];
                 hlist_for_each_entry_safe(req, tmp, list, hash_node) {
                         if (io_match_task_safe(req, tsk, cancel_all)) {
+                               hlist_del_init(&req->hash_node);
                                 io_poll_cancel_req(req);
                                 found = true;
                         }
@@ -5849,6 +5896,8 @@ static int io_poll_add(struct io_kiocb *req, unsigned int issue_flags)
         ipt.pt._qproc = io_poll_queue_proc;
  
         ret = __io_arm_poll_handler(req, &req->poll, &ipt, poll->events);
+       if (!ret && ipt.error)
+               req_set_fail(req);
         ret = ret ?: ipt.error;
         if (ret)
                 __io_req_complete(req, issue_flags, ret, 0);
@@ -8024,6 +8073,7 @@ static int __io_sqe_files_scm(struct io_ring_ctx *ctx, int nr, int offset)
         }
  
         skb->sk = sk;
+       skb->scm_io_uring = 1;
  
         nr_files = 0;
         fpl->user = get_uid(current_user());
@@ -9260,11 +9310,6 @@ static void io_ring_ctx_free(struct io_ring_ctx *ctx)
  {
         io_sq_thread_finish(ctx);
  
-       if (ctx->mm_account) {
-               mmdrop(ctx->mm_account);
-               ctx->mm_account = NULL;
-       }
-
         /* __io_rsrc_put_work() may need uring_lock to progress, wait w/o it */
         io_wait_rsrc_data(ctx->buf_data);
         io_wait_rsrc_data(ctx->file_data);
@@ -9300,6 +9345,11 @@ static void io_ring_ctx_free(struct io_ring_ctx *ctx)
  #endif
         WARN_ON_ONCE(!list_empty(&ctx->ltimeout_list));
  
+       if (ctx->mm_account) {
+               mmdrop(ctx->mm_account);
+               ctx->mm_account = NULL;
+       }
+
         io_mem_free(ctx->rings);
         io_mem_free(ctx->sq_sqes);