Merge tag 'block-5.16-2021-11-19' of git://git.kernel.dk/linux-block
author Linus Torvalds <torvalds@linux-foundation.org>
Sat, 20 Nov 2021 19:05:10 +0000 (11:05 -0800)
committer Linus Torvalds <torvalds@linux-foundation.org>
Sat, 20 Nov 2021 19:05:10 +0000 (11:05 -0800)
Pull block fixes from Jens Axboe:

 - Flip the order of a capability check to avoid a spurious SELinux denial (Alistair)

 - Fix for a regression this merge window where we can miss a queue ref
   put (me)

 - Un-mark pstore-blk as broken, as the condition that triggered that
   change has been rectified (Kees)

 - Queue quiesce and sync fixes (Ming)

 - FUA insertion fix (Ming)

 - blk-cgroup error path put fix (Yu)

* tag 'block-5.16-2021-11-19' of git://git.kernel.dk/linux-block:
  blk-mq: don't insert FUA request with data into scheduler queue
  blk-cgroup: fix missing put device in error path from blkg_conf_prep()
  block: avoid to quiesce queue in elevator_init_mq
  Revert "mark pstore-blk as broken"
  blk-mq: cancel blk-mq dispatch work in both blk_cleanup_queue and disk_release()
  block: fix missing queue put in error path
  block: Check ADMIN before NICE for IOPRIO_CLASS_RT

block/blk-cgroup.c
block/blk-core.c
block/blk-flush.c
block/blk-mq.c
block/blk-mq.h
block/blk-sysfs.c
block/blk.h
block/elevator.c
block/genhd.c
block/ioprio.c
fs/pstore/Kconfig

diff --git a/block/blk-cgroup.c b/block/blk-cgroup.c
index 88b1fce..663aabf 100644
@@ -640,7 +640,7 @@ int blkg_conf_prep(struct blkcg *blkcg, const struct blkcg_policy *pol,
         */
        ret = blk_queue_enter(q, 0);
        if (ret)
-               return ret;
+               goto fail;
 
        rcu_read_lock();
        spin_lock_irq(&q->queue_lock);
@@ -676,13 +676,13 @@ int blkg_conf_prep(struct blkcg *blkcg, const struct blkcg_policy *pol,
                new_blkg = blkg_alloc(pos, q, GFP_KERNEL);
                if (unlikely(!new_blkg)) {
                        ret = -ENOMEM;
-                       goto fail;
+                       goto fail_exit_queue;
                }
 
                if (radix_tree_preload(GFP_KERNEL)) {
                        blkg_free(new_blkg);
                        ret = -ENOMEM;
-                       goto fail;
+                       goto fail_exit_queue;
                }
 
                rcu_read_lock();
@@ -722,9 +722,10 @@ fail_preloaded:
 fail_unlock:
        spin_unlock_irq(&q->queue_lock);
        rcu_read_unlock();
+fail_exit_queue:
+       blk_queue_exit(q);
 fail:
        blkdev_put_no_open(bdev);
-       blk_queue_exit(q);
        /*
         * If queue was bypassing, we should retry.  Do so after a
         * short msleep().  It isn't strictly necessary but queue
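A note on the blk-cgroup hunks above: they are about unwind ordering. blkg_conf_prep() takes a block device reference and then enters the queue, so its error labels must release those in reverse order, and a failed blk_queue_enter() must still drop the device reference (that was the missing put) without ever calling blk_queue_exit(). Below is a minimal userspace model of that goto-unwind pattern; the helper names (open_dev(), enter_queue(), ...) are made up for illustration and are not kernel APIs.

#include <stdio.h>

/* Hypothetical helpers standing in for "get a device ref" and "enter a queue". */
static int open_dev(void)    { puts("open_dev");    return 0; }
static void put_dev(void)    { puts("put_dev"); }
static int enter_queue(void) { puts("enter_queue"); return 0; }
static void exit_queue(void) { puts("exit_queue"); }
static int do_config(void)   { puts("do_config");   return -1; /* simulate a late failure */ }

static int configure(void)
{
    int ret;

    ret = open_dev();
    if (ret)
        return ret;                 /* nothing acquired yet, a plain return is fine */

    ret = enter_queue();
    if (ret)
        goto fail;                  /* only the device reference is held here */

    ret = do_config();
    if (ret)
        goto fail_exit_queue;       /* both the device ref and the queue ref are held */

    exit_queue();
    put_dev();
    return 0;

fail_exit_queue:
    exit_queue();                   /* undo enter_queue() */
fail:
    put_dev();                      /* undo open_dev(); reached on every failure path */
    return ret;
}

int main(void)
{
    return configure() ? 1 : 0;
}

Each failure jumps to the label that releases exactly what has been acquired so far, which is the invariant the new fail_exit_queue label restores.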
diff --git a/block/blk-core.c b/block/blk-core.c
index 9ee32f8..f0f38ca 100644
@@ -363,8 +363,10 @@ void blk_cleanup_queue(struct request_queue *q)
        blk_queue_flag_set(QUEUE_FLAG_DEAD, q);
 
        blk_sync_queue(q);
-       if (queue_is_mq(q))
+       if (queue_is_mq(q)) {
+               blk_mq_cancel_work_sync(q);
                blk_mq_exit_queue(q);
+       }
 
        /*
         * In theory, request pool of sched_tags belongs to request queue.
diff --git a/block/blk-flush.c b/block/blk-flush.c
index 8e364bd..1fce6d1 100644
@@ -379,7 +379,7 @@ static void mq_flush_data_end_io(struct request *rq, blk_status_t error)
  * @rq is being submitted.  Analyze what needs to be done and put it on the
  * right queue.
  */
-bool blk_insert_flush(struct request *rq)
+void blk_insert_flush(struct request *rq)
 {
        struct request_queue *q = rq->q;
        unsigned long fflags = q->queue_flags;  /* may change, cache */
@@ -409,7 +409,7 @@ bool blk_insert_flush(struct request *rq)
         */
        if (!policy) {
                blk_mq_end_request(rq, 0);
-               return true;
+               return;
        }
 
        BUG_ON(rq->bio != rq->biotail); /*assumes zero or single bio rq */
@@ -420,8 +420,10 @@ bool blk_insert_flush(struct request *rq)
         * for normal execution.
         */
        if ((policy & REQ_FSEQ_DATA) &&
-           !(policy & (REQ_FSEQ_PREFLUSH | REQ_FSEQ_POSTFLUSH)))
-               return false;
+           !(policy & (REQ_FSEQ_PREFLUSH | REQ_FSEQ_POSTFLUSH))) {
+               blk_mq_request_bypass_insert(rq, false, true);
+               return;
+       }
 
        /*
         * @rq should go through flush machinery.  Mark it part of flush
@@ -437,8 +439,6 @@ bool blk_insert_flush(struct request *rq)
        spin_lock_irq(&fq->mq_flush_lock);
        blk_flush_complete_seq(rq, fq, REQ_FSEQ_ACTIONS & ~policy, 0);
        spin_unlock_irq(&fq->mq_flush_lock);
-
-       return true;
 }
 
 /**
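For context on the FUA change: blk_insert_flush() classifies a request with a small policy bitmask (data, pre-flush, post-flush). A write that carries data but needs neither a pre- nor a post-flush, for example a FUA write on hardware that supports FUA, now goes straight to the dispatch list via blk_mq_request_bypass_insert() instead of returning a hint to the caller, so it can no longer end up in the scheduler queue. The following is a rough standalone model of that classification; the flag and field names are simplified stand-ins, not the kernel's definitions.

#include <stdbool.h>
#include <stdio.h>

enum { FSEQ_DATA = 1, FSEQ_PREFLUSH = 2, FSEQ_POSTFLUSH = 4 };

struct req   { bool has_data, wants_preflush, wants_fua; };
struct queue { bool writeback_cache, hw_fua; };

static unsigned flush_policy(const struct queue *q, const struct req *rq)
{
    unsigned policy = 0;

    if (rq->has_data)
        policy |= FSEQ_DATA;
    if (q->writeback_cache) {
        if (rq->wants_preflush)
            policy |= FSEQ_PREFLUSH;
        if (rq->wants_fua && !q->hw_fua)
            policy |= FSEQ_POSTFLUSH;   /* emulate FUA with a post-flush */
    }
    return policy;
}

int main(void)
{
    struct queue q  = { .writeback_cache = true, .hw_fua = true };
    struct req   rq = { .has_data = true, .wants_fua = true };
    unsigned policy = flush_policy(&q, &rq);

    if (!policy)
        puts("no flush needed: complete immediately");
    else if ((policy & FSEQ_DATA) &&
             !(policy & (FSEQ_PREFLUSH | FSEQ_POSTFLUSH)))
        puts("data only: bypass the scheduler, insert straight into dispatch");
    else
        puts("run through the flush state machine");
    return 0;
}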
diff --git a/block/blk-mq.c b/block/blk-mq.c
index 3ab34c4..8799fa7 100644
@@ -2543,8 +2543,7 @@ static struct request *blk_mq_get_new_requests(struct request_queue *q,
        return NULL;
 }
 
-static inline bool blk_mq_can_use_cached_rq(struct request *rq,
-               struct bio *bio)
+static inline bool blk_mq_can_use_cached_rq(struct request *rq, struct bio *bio)
 {
        if (blk_mq_get_hctx_type(bio->bi_opf) != rq->mq_hctx->type)
                return false;
@@ -2565,7 +2564,6 @@ static inline struct request *blk_mq_get_request(struct request_queue *q,
        bool checked = false;
 
        if (plug) {
-
                rq = rq_list_peek(&plug->cached_rq);
                if (rq && rq->q == q) {
                        if (unlikely(!submit_bio_checks(bio)))
@@ -2587,12 +2585,14 @@ static inline struct request *blk_mq_get_request(struct request_queue *q,
 fallback:
        if (unlikely(bio_queue_enter(bio)))
                return NULL;
-       if (!checked && !submit_bio_checks(bio))
-               return NULL;
+       if (unlikely(!checked && !submit_bio_checks(bio)))
+               goto out_put;
        rq = blk_mq_get_new_requests(q, plug, bio, nsegs, same_queue_rq);
-       if (!rq)
-               blk_queue_exit(q);
-       return rq;
+       if (rq)
+               return rq;
+out_put:
+       blk_queue_exit(q);
+       return NULL;
 }
 
 /**
@@ -2647,8 +2647,10 @@ void blk_mq_submit_bio(struct bio *bio)
                return;
        }
 
-       if (op_is_flush(bio->bi_opf) && blk_insert_flush(rq))
+       if (op_is_flush(bio->bi_opf)) {
+               blk_insert_flush(rq);
                return;
+       }
 
        if (plug && (q->nr_hw_queues == 1 ||
            blk_mq_is_shared_tags(rq->mq_hctx->flags) ||
@@ -4417,6 +4419,19 @@ unsigned int blk_mq_rq_cpu(struct request *rq)
 }
 EXPORT_SYMBOL(blk_mq_rq_cpu);
 
+void blk_mq_cancel_work_sync(struct request_queue *q)
+{
+       if (queue_is_mq(q)) {
+               struct blk_mq_hw_ctx *hctx;
+               int i;
+
+               cancel_delayed_work_sync(&q->requeue_work);
+
+               queue_for_each_hw_ctx(q, hctx, i)
+                       cancel_delayed_work_sync(&hctx->run_work);
+       }
+}
+
 static int __init blk_mq_init(void)
 {
        int i;
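blk_mq_cancel_work_sync() above consolidates the delayed-work cancellation that used to sit in blk_release_queue() (see the blk-sysfs.c hunk below), so both blk_cleanup_queue() and disk_release() can guarantee that no requeue or hctx run work is still pending while the queue is being torn down. The hazard being closed is deferred work outliving the object it touches. Here is a minimal pthread-based model of cancel-then-free; it is purely illustrative and not kernel code.

#include <pthread.h>
#include <stdatomic.h>
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>

struct delayed_work {
    pthread_t   thread;
    int         queued;
    atomic_bool cancelled;
    void      (*fn)(void *);
    void       *arg;
};

static void *work_thread(void *p)
{
    struct delayed_work *w = p;

    usleep(100 * 1000);              /* the "delay" before the work runs */
    if (!w->cancelled)
        w->fn(w->arg);
    return NULL;
}

static void queue_delayed_work(struct delayed_work *w, void (*fn)(void *), void *arg)
{
    w->fn = fn;
    w->arg = arg;
    w->cancelled = false;
    w->queued = 1;
    pthread_create(&w->thread, NULL, work_thread, w);
}

static void cancel_work_sync(struct delayed_work *w)
{
    if (!w->queued)
        return;
    w->cancelled = true;             /* stop it from running ...           */
    pthread_join(w->thread, NULL);   /* ... and wait until it no longer can */
    w->queued = 0;
}

struct queue { struct delayed_work run_work; int data; };

static void run_queue(void *arg) { printf("running queue %d\n", ((struct queue *)arg)->data); }

int main(void)
{
    struct queue *q = calloc(1, sizeof(*q));

    if (!q)
        return 1;
    q->data = 42;
    queue_delayed_work(&q->run_work, run_queue, q);

    cancel_work_sync(&q->run_work);  /* without this, run_queue() could fire after free() */
    free(q);
    return 0;
}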
diff --git a/block/blk-mq.h b/block/blk-mq.h
index 8acfa65..afcf993 100644
@@ -128,6 +128,8 @@ extern void blk_mq_hctx_kobj_init(struct blk_mq_hw_ctx *hctx);
 void blk_mq_free_plug_rqs(struct blk_plug *plug);
 void blk_mq_flush_plug_list(struct blk_plug *plug, bool from_schedule);
 
+void blk_mq_cancel_work_sync(struct request_queue *q);
+
 void blk_mq_release(struct request_queue *q);
 
 static inline struct blk_mq_ctx *__blk_mq_get_ctx(struct request_queue *q,
diff --git a/block/blk-sysfs.c b/block/blk-sysfs.c
index cef1f71..cd75b0f 100644
@@ -791,16 +791,6 @@ static void blk_release_queue(struct kobject *kobj)
 
        blk_free_queue_stats(q->stats);
 
-       if (queue_is_mq(q)) {
-               struct blk_mq_hw_ctx *hctx;
-               int i;
-
-               cancel_delayed_work_sync(&q->requeue_work);
-
-               queue_for_each_hw_ctx(q, hctx, i)
-                       cancel_delayed_work_sync(&hctx->run_work);
-       }
-
        blk_exit_queue(q);
 
        blk_queue_free_zone_bitmaps(q);
diff --git a/block/blk.h b/block/blk.h
index b4fed20..ccde6e6 100644
@@ -271,7 +271,7 @@ void __blk_account_io_done(struct request *req, u64 now);
  */
 #define ELV_ON_HASH(rq) ((rq)->rq_flags & RQF_HASHED)
 
-bool blk_insert_flush(struct request *rq);
+void blk_insert_flush(struct request *rq);
 
 int elevator_switch_mq(struct request_queue *q,
                              struct elevator_type *new_e);
diff --git a/block/elevator.c b/block/elevator.c
index 1f39f6e..19a78d5 100644
@@ -694,12 +694,18 @@ void elevator_init_mq(struct request_queue *q)
        if (!e)
                return;
 
+       /*
+        * We are called before adding disk, when there isn't any FS I/O,
+        * so freezing queue plus canceling dispatch work is enough to
+        * drain any dispatch activities originated from passthrough
+        * requests, then no need to quiesce queue which may add long boot
+        * latency, especially when lots of disks are involved.
+        */
        blk_mq_freeze_queue(q);
-       blk_mq_quiesce_queue(q);
+       blk_mq_cancel_work_sync(q);
 
        err = blk_mq_init_sched(q, e);
 
-       blk_mq_unquiesce_queue(q);
        blk_mq_unfreeze_queue(q);
 
        if (err) {
diff --git a/block/genhd.c b/block/genhd.c
index c5392cc..30362ae 100644
@@ -1111,6 +1111,8 @@ static void disk_release(struct device *dev)
        might_sleep();
        WARN_ON_ONCE(disk_live(disk));
 
+       blk_mq_cancel_work_sync(disk->queue);
+
        disk_release_events(disk);
        kfree(disk->random);
        xa_destroy(&disk->part_tbl);
diff --git a/block/ioprio.c b/block/ioprio.c
index 0e4ff24..313c14a 100644
@@ -69,7 +69,14 @@ int ioprio_check_cap(int ioprio)
 
        switch (class) {
                case IOPRIO_CLASS_RT:
-                       if (!capable(CAP_SYS_NICE) && !capable(CAP_SYS_ADMIN))
+                       /*
+                        * Originally this only checked for CAP_SYS_ADMIN,
+                        * which was implicitly allowed for pid 0 by security
+                        * modules such as SELinux. Make sure we check
+                        * CAP_SYS_ADMIN first to avoid a denial/avc for
+                        * possibly missing CAP_SYS_NICE permission.
+                        */
+                       if (!capable(CAP_SYS_ADMIN) && !capable(CAP_SYS_NICE))
                                return -EPERM;
                        fallthrough;
                        /* rt has prio field too */
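The ordering in the ioprio hunk matters because capable() is not a pure predicate: a failing check can be reported by the LSM, for example as an SELinux AVC denial. Checking CAP_SYS_ADMIN first lets an admin-capable task short-circuit before CAP_SYS_NICE is ever evaluated, so no denial is logged for a capability it does not actually need. Below is a tiny standalone model of why the short-circuit order is user-visible; the logging here is hypothetical and stands in for the LSM, it is not the kernel's capable().

#include <stdbool.h>
#include <stdio.h>

static bool has_admin = true;   /* pretend: a privileged task ...              */
static bool has_nice  = false;  /* ... that was never granted CAP_SYS_NICE     */

static bool check_cap(const char *name, bool granted)
{
    if (!granted)
        printf("denial logged for %s\n", name);  /* the noise the reorder avoids */
    return granted;
}

static int ioprio_check_cap_model(void)
{
    /* Old order checked NICE first, logging a spurious denial for admin tasks.
     * New order checks ADMIN first and short-circuits before NICE is touched. */
    if (!check_cap("CAP_SYS_ADMIN", has_admin) &&
        !check_cap("CAP_SYS_NICE", has_nice))
        return -1;  /* -EPERM */
    return 0;
}

int main(void)
{
    return ioprio_check_cap_model() ? 1 : 0;
}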
diff --git a/fs/pstore/Kconfig b/fs/pstore/Kconfig
index 328da35..8adabde 100644
@@ -173,7 +173,6 @@ config PSTORE_BLK
        tristate "Log panic/oops to a block device"
        depends on PSTORE
        depends on BLOCK
-       depends on BROKEN
        select PSTORE_ZONE
        default n
        help