/*
 * Functions related to sysfs handling
 */

#include <linux/kernel.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/bio.h>
#include <linux/blkdev.h>
#include <linux/backing-dev.h>
#include <linux/blktrace_api.h>
#include <linux/blk-mq.h>
#include <linux/blk-cgroup.h>

#include "blk.h"
#include "blk-mq.h"
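
/*
 * Each attribute exported under /sys/block/<disk>/queue/ is described by
 * a queue_sysfs_entry: the sysfs attribute itself plus the show/store
 * callbacks that format or parse its value for the owning request_queue.
 */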

struct queue_sysfs_entry {
	struct attribute attr;
	ssize_t (*show)(struct request_queue *, char *);
	ssize_t (*store)(struct request_queue *, const char *, size_t);
};

static ssize_t
queue_var_show(unsigned long var, char *page)
{
	return sprintf(page, "%lu\n", var);
}

static ssize_t
queue_var_store(unsigned long *var, const char *page, size_t count)
{
	int err;
	unsigned long v;

	err = kstrtoul(page, 10, &v);
	if (err || v > UINT_MAX)
		return -EINVAL;

	*var = v;

	return count;
}

static ssize_t queue_requests_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->nr_requests, (page));
}
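
/*
 * nr_requests is writable only when the queue actually allocates requests,
 * i.e. it has a legacy ->request_fn or blk-mq ->mq_ops.  Values below
 * BLKDEV_MIN_RQ are rounded up before the queue depth is updated.
 */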

static ssize_t
queue_requests_store(struct request_queue *q, const char *page, size_t count)
{
	unsigned long nr;
	int ret, err;

	if (!q->request_fn && !q->mq_ops)
		return -EINVAL;

	ret = queue_var_store(&nr, page, count);
	if (ret < 0)
		return ret;

	if (nr < BLKDEV_MIN_RQ)
		nr = BLKDEV_MIN_RQ;

	if (q->request_fn)
		err = blk_update_nr_requests(q, nr);
	else
		err = blk_mq_update_nr_requests(q, nr);

	if (err)
		return err;

	return ret;
}

static ssize_t queue_ra_show(struct request_queue *q, char *page)
{
	unsigned long ra_kb = q->backing_dev_info.ra_pages <<
					(PAGE_SHIFT - 10);

	return queue_var_show(ra_kb, (page));
}

static ssize_t
queue_ra_store(struct request_queue *q, const char *page, size_t count)
{
	unsigned long ra_kb;
	ssize_t ret = queue_var_store(&ra_kb, page, count);

	if (ret < 0)
		return ret;

	q->backing_dev_info.ra_pages = ra_kb >> (PAGE_SHIFT - 10);

	return ret;
}

static ssize_t queue_max_sectors_show(struct request_queue *q, char *page)
{
	int max_sectors_kb = queue_max_sectors(q) >> 1;

	return queue_var_show(max_sectors_kb, (page));
}

static ssize_t queue_max_segments_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_max_segments(q), (page));
}

static ssize_t queue_max_integrity_segments_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->limits.max_integrity_segments, (page));
}

static ssize_t queue_max_segment_size_show(struct request_queue *q, char *page)
{
	if (blk_queue_cluster(q))
		return queue_var_show(queue_max_segment_size(q), (page));

	return queue_var_show(PAGE_SIZE, (page));
}

static ssize_t queue_logical_block_size_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_logical_block_size(q), page);
}

static ssize_t queue_physical_block_size_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_physical_block_size(q), page);
}

static ssize_t queue_io_min_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_io_min(q), page);
}

static ssize_t queue_io_opt_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_io_opt(q), page);
}

static ssize_t queue_discard_granularity_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->limits.discard_granularity, page);
}

static ssize_t queue_discard_max_hw_show(struct request_queue *q, char *page)
{
	return sprintf(page, "%llu\n",
		(unsigned long long)q->limits.max_hw_discard_sectors << 9);
}

static ssize_t queue_discard_max_show(struct request_queue *q, char *page)
{
	return sprintf(page, "%llu\n",
		(unsigned long long)q->limits.max_discard_sectors << 9);
}
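
/*
 * discard_max_bytes is writable so that userspace can reduce the discard
 * size below the hardware limit.  The value is parsed in bytes, must be a
 * multiple of discard_granularity, and is kept internally in 512-byte
 * sectors, capped at max_hw_discard_sectors.
 */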

static ssize_t queue_discard_max_store(struct request_queue *q,
				       const char *page, size_t count)
{
	unsigned long max_discard;
	ssize_t ret = queue_var_store(&max_discard, page, count);

	if (ret < 0)
		return ret;

	if (max_discard & (q->limits.discard_granularity - 1))
		return -EINVAL;

	max_discard >>= 9;
	if (max_discard > UINT_MAX)
		return -EINVAL;

	if (max_discard > q->limits.max_hw_discard_sectors)
		max_discard = q->limits.max_hw_discard_sectors;

	q->limits.max_discard_sectors = max_discard;
	return ret;
}

static ssize_t queue_discard_zeroes_data_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_discard_zeroes_data(q), page);
}

static ssize_t queue_write_same_max_show(struct request_queue *q, char *page)
{
	return sprintf(page, "%llu\n",
		(unsigned long long)q->limits.max_write_same_sectors << 9);
}
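
/*
 * max_sectors_kb is exposed in kilobytes but kept internally in 512-byte
 * sectors, hence the <<1/>>1 conversions below.  Writes are clamped
 * between one page and the hardware/device limit.
 */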

static ssize_t
queue_max_sectors_store(struct request_queue *q, const char *page, size_t count)
{
	unsigned long max_sectors_kb,
		max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1,
			page_kb = 1 << (PAGE_SHIFT - 10);
	ssize_t ret = queue_var_store(&max_sectors_kb, page, count);

	if (ret < 0)
		return ret;

	max_hw_sectors_kb = min_not_zero(max_hw_sectors_kb, (unsigned long)
					 q->limits.max_dev_sectors >> 1);

	if (max_sectors_kb > max_hw_sectors_kb || max_sectors_kb < page_kb)
		return -EINVAL;

	spin_lock_irq(q->queue_lock);
	q->limits.max_sectors = max_sectors_kb << 1;
	spin_unlock_irq(q->queue_lock);

	return ret;
}

static ssize_t queue_max_hw_sectors_show(struct request_queue *q, char *page)
{
	int max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1;

	return queue_var_show(max_hw_sectors_kb, (page));
}
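
/*
 * Boolean queue flags (rotational, add_random, iostats) all follow the
 * same show/store pattern, so the pairs are generated by the macro below.
 * "neg" inverts the exported value; e.g. "rotational" is the negation of
 * QUEUE_FLAG_NONROT.
 */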
#define QUEUE_SYSFS_BIT_FNS(name, flag, neg)				\
static ssize_t								\
queue_show_##name(struct request_queue *q, char *page)			\
{									\
	int bit;							\
	bit = test_bit(QUEUE_FLAG_##flag, &q->queue_flags);		\
	return queue_var_show(neg ? !bit : bit, page);			\
}									\
static ssize_t								\
queue_store_##name(struct request_queue *q, const char *page, size_t count) \
{									\
	unsigned long val;						\
	ssize_t ret;							\
	ret = queue_var_store(&val, page, count);			\
	if (ret < 0)							\
		return ret;						\
	if (neg)							\
		val = !val;						\
									\
	spin_lock_irq(q->queue_lock);					\
	if (val)							\
		queue_flag_set(QUEUE_FLAG_##flag, q);			\
	else								\
		queue_flag_clear(QUEUE_FLAG_##flag, q);			\
	spin_unlock_irq(q->queue_lock);					\
	return ret;							\
}

QUEUE_SYSFS_BIT_FNS(nonrot, NONROT, 1);
QUEUE_SYSFS_BIT_FNS(random, ADD_RANDOM, 0);
QUEUE_SYSFS_BIT_FNS(iostats, IO_STAT, 0);
#undef QUEUE_SYSFS_BIT_FNS
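
/*
 * nomerges is a tri-state: 0 allows all merging, 1 disables only the more
 * expensive merge lookups (NOXMERGES), 2 disables merging entirely
 * (NOMERGES).  The show side reconstructs that value from the two flags.
 */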

static ssize_t queue_nomerges_show(struct request_queue *q, char *page)
{
	return queue_var_show((blk_queue_nomerges(q) << 1) |
			       blk_queue_noxmerges(q), page);
}

static ssize_t queue_nomerges_store(struct request_queue *q, const char *page,
				    size_t count)
{
	unsigned long nm;
	ssize_t ret = queue_var_store(&nm, page, count);

	if (ret < 0)
		return ret;

	spin_lock_irq(q->queue_lock);
	queue_flag_clear(QUEUE_FLAG_NOMERGES, q);
	queue_flag_clear(QUEUE_FLAG_NOXMERGES, q);
	if (nm == 2)
		queue_flag_set(QUEUE_FLAG_NOMERGES, q);
	else if (nm)
		queue_flag_set(QUEUE_FLAG_NOXMERGES, q);
	spin_unlock_irq(q->queue_lock);

	return ret;
}
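
/*
 * rq_affinity: 0 = no completion steering, 1 = complete in the submitting
 * CPU's group (SAME_COMP), 2 = force completion on the exact submitting
 * CPU (SAME_FORCE).  The show side encodes this as set << force.
 */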

static ssize_t queue_rq_affinity_show(struct request_queue *q, char *page)
{
	bool set = test_bit(QUEUE_FLAG_SAME_COMP, &q->queue_flags);
	bool force = test_bit(QUEUE_FLAG_SAME_FORCE, &q->queue_flags);

	return queue_var_show(set << force, page);
}

static ssize_t
queue_rq_affinity_store(struct request_queue *q, const char *page, size_t count)
{
	ssize_t ret = -EINVAL;
#ifdef CONFIG_SMP
	unsigned long val;

	ret = queue_var_store(&val, page, count);
	if (ret < 0)
		return ret;

	spin_lock_irq(q->queue_lock);
	if (val == 2) {
		queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_set(QUEUE_FLAG_SAME_FORCE, q);
	} else if (val == 1) {
		queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
	} else if (val == 0) {
		queue_flag_clear(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
	}
	spin_unlock_irq(q->queue_lock);
#endif
	return ret;
}

static ssize_t queue_poll_show(struct request_queue *q, char *page)
{
	return queue_var_show(test_bit(QUEUE_FLAG_POLL, &q->queue_flags), page);
}

static ssize_t queue_poll_store(struct request_queue *q, const char *page,
				size_t count)
{
	unsigned long poll_on;
	ssize_t ret;

	if (!q->mq_ops || !q->mq_ops->poll)
		return -EINVAL;

	ret = queue_var_store(&poll_on, page, count);
	if (ret < 0)
		return ret;

	spin_lock_irq(q->queue_lock);
	if (poll_on)
		queue_flag_set(QUEUE_FLAG_POLL, q);
	else
		queue_flag_clear(QUEUE_FLAG_POLL, q);
	spin_unlock_irq(q->queue_lock);

	return ret;
}
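
/*
 * Definitions of the individual sysfs attributes.  Read-only attributes
 * use S_IRUGO and provide only a ->show method; writable attributes add
 * S_IWUSR and a ->store method.
 */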

static struct queue_sysfs_entry queue_requests_entry = {
	.attr = {.name = "nr_requests", .mode = S_IRUGO | S_IWUSR },
	.show = queue_requests_show,
	.store = queue_requests_store,
};

static struct queue_sysfs_entry queue_ra_entry = {
	.attr = {.name = "read_ahead_kb", .mode = S_IRUGO | S_IWUSR },
	.show = queue_ra_show,
	.store = queue_ra_store,
};

static struct queue_sysfs_entry queue_max_sectors_entry = {
	.attr = {.name = "max_sectors_kb", .mode = S_IRUGO | S_IWUSR },
	.show = queue_max_sectors_show,
	.store = queue_max_sectors_store,
};

static struct queue_sysfs_entry queue_max_hw_sectors_entry = {
	.attr = {.name = "max_hw_sectors_kb", .mode = S_IRUGO },
	.show = queue_max_hw_sectors_show,
};

static struct queue_sysfs_entry queue_max_segments_entry = {
	.attr = {.name = "max_segments", .mode = S_IRUGO },
	.show = queue_max_segments_show,
};

static struct queue_sysfs_entry queue_max_integrity_segments_entry = {
	.attr = {.name = "max_integrity_segments", .mode = S_IRUGO },
	.show = queue_max_integrity_segments_show,
};

static struct queue_sysfs_entry queue_max_segment_size_entry = {
	.attr = {.name = "max_segment_size", .mode = S_IRUGO },
	.show = queue_max_segment_size_show,
};

static struct queue_sysfs_entry queue_iosched_entry = {
	.attr = {.name = "scheduler", .mode = S_IRUGO | S_IWUSR },
	.show = elv_iosched_show,
	.store = elv_iosched_store,
};

static struct queue_sysfs_entry queue_hw_sector_size_entry = {
	.attr = {.name = "hw_sector_size", .mode = S_IRUGO },
	.show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_logical_block_size_entry = {
	.attr = {.name = "logical_block_size", .mode = S_IRUGO },
	.show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_physical_block_size_entry = {
	.attr = {.name = "physical_block_size", .mode = S_IRUGO },
	.show = queue_physical_block_size_show,
};

static struct queue_sysfs_entry queue_io_min_entry = {
	.attr = {.name = "minimum_io_size", .mode = S_IRUGO },
	.show = queue_io_min_show,
};

static struct queue_sysfs_entry queue_io_opt_entry = {
	.attr = {.name = "optimal_io_size", .mode = S_IRUGO },
	.show = queue_io_opt_show,
};

static struct queue_sysfs_entry queue_discard_granularity_entry = {
	.attr = {.name = "discard_granularity", .mode = S_IRUGO },
	.show = queue_discard_granularity_show,
};

static struct queue_sysfs_entry queue_discard_max_hw_entry = {
	.attr = {.name = "discard_max_hw_bytes", .mode = S_IRUGO },
	.show = queue_discard_max_hw_show,
};

static struct queue_sysfs_entry queue_discard_max_entry = {
	.attr = {.name = "discard_max_bytes", .mode = S_IRUGO | S_IWUSR },
	.show = queue_discard_max_show,
	.store = queue_discard_max_store,
};

static struct queue_sysfs_entry queue_discard_zeroes_data_entry = {
	.attr = {.name = "discard_zeroes_data", .mode = S_IRUGO },
	.show = queue_discard_zeroes_data_show,
};

static struct queue_sysfs_entry queue_write_same_max_entry = {
	.attr = {.name = "write_same_max_bytes", .mode = S_IRUGO },
	.show = queue_write_same_max_show,
};

static struct queue_sysfs_entry queue_nonrot_entry = {
	.attr = {.name = "rotational", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_nonrot,
	.store = queue_store_nonrot,
};

static struct queue_sysfs_entry queue_nomerges_entry = {
	.attr = {.name = "nomerges", .mode = S_IRUGO | S_IWUSR },
	.show = queue_nomerges_show,
	.store = queue_nomerges_store,
};

static struct queue_sysfs_entry queue_rq_affinity_entry = {
	.attr = {.name = "rq_affinity", .mode = S_IRUGO | S_IWUSR },
	.show = queue_rq_affinity_show,
	.store = queue_rq_affinity_store,
};

static struct queue_sysfs_entry queue_iostats_entry = {
	.attr = {.name = "iostats", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_iostats,
	.store = queue_store_iostats,
};

static struct queue_sysfs_entry queue_random_entry = {
	.attr = {.name = "add_random", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_random,
	.store = queue_store_random,
};

static struct queue_sysfs_entry queue_poll_entry = {
	.attr = {.name = "io_poll", .mode = S_IRUGO | S_IWUSR },
	.show = queue_poll_show,
	.store = queue_poll_store,
};

static struct attribute *default_attrs[] = {
	&queue_requests_entry.attr,
	&queue_ra_entry.attr,
	&queue_max_hw_sectors_entry.attr,
	&queue_max_sectors_entry.attr,
	&queue_max_segments_entry.attr,
	&queue_max_integrity_segments_entry.attr,
	&queue_max_segment_size_entry.attr,
	&queue_iosched_entry.attr,
	&queue_hw_sector_size_entry.attr,
	&queue_logical_block_size_entry.attr,
	&queue_physical_block_size_entry.attr,
	&queue_io_min_entry.attr,
	&queue_io_opt_entry.attr,
	&queue_discard_granularity_entry.attr,
	&queue_discard_max_entry.attr,
	&queue_discard_max_hw_entry.attr,
	&queue_discard_zeroes_data_entry.attr,
	&queue_write_same_max_entry.attr,
	&queue_nonrot_entry.attr,
	&queue_nomerges_entry.attr,
	&queue_rq_affinity_entry.attr,
	&queue_iostats_entry.attr,
	&queue_random_entry.attr,
	&queue_poll_entry.attr,
	NULL,
};

#define to_queue(atr) container_of((atr), struct queue_sysfs_entry, attr)
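
/*
 * Generic sysfs entry points: map the kobject and attribute back to the
 * request_queue and queue_sysfs_entry, then invoke the per-attribute
 * callback under q->sysfs_lock, refusing access once the queue is dying.
 */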

static ssize_t
queue_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
{
	struct queue_sysfs_entry *entry = to_queue(attr);
	struct request_queue *q =
		container_of(kobj, struct request_queue, kobj);
	ssize_t res;

	if (!entry->show)
		return -EIO;
	mutex_lock(&q->sysfs_lock);
	if (blk_queue_dying(q)) {
		mutex_unlock(&q->sysfs_lock);
		return -ENOENT;
	}
	res = entry->show(q, page);
	mutex_unlock(&q->sysfs_lock);
	return res;
}

static ssize_t
queue_attr_store(struct kobject *kobj, struct attribute *attr,
		 const char *page, size_t length)
{
	struct queue_sysfs_entry *entry = to_queue(attr);
	struct request_queue *q;
	ssize_t res;

	if (!entry->store)
		return -EIO;

	q = container_of(kobj, struct request_queue, kobj);
	mutex_lock(&q->sysfs_lock);
	if (blk_queue_dying(q)) {
		mutex_unlock(&q->sysfs_lock);
		return -ENOENT;
	}
	res = entry->store(q, page, length);
	mutex_unlock(&q->sysfs_lock);
	return res;
}

static void blk_free_queue_rcu(struct rcu_head *rcu_head)
{
	struct request_queue *q = container_of(rcu_head, struct request_queue,
					       rcu_head);
	kmem_cache_free(blk_requestq_cachep, q);
}

/**
 * blk_release_queue: - release a &struct request_queue when it is no longer needed
 * @kobj: the kobj belonging to the request queue to be released
 *
 * Description:
 *     blk_release_queue is the pair to blk_init_queue() or
 *     blk_queue_make_request().  It should be called when a request queue is
 *     being released; typically when a block device is being de-registered.
 *     Currently, its primary task is to free all the &struct request
 *     structures that were allocated to the queue and the queue itself.
 *
 * Note:
 *     The low level driver must have finished any outstanding requests first
 *     via blk_cleanup_queue().
 */
static void blk_release_queue(struct kobject *kobj)
{
	struct request_queue *q =
		container_of(kobj, struct request_queue, kobj);

	bdi_exit(&q->backing_dev_info);
	blkcg_exit_queue(q);

	if (q->elevator) {
		spin_lock_irq(q->queue_lock);
		ioc_clear_queue(q);
		spin_unlock_irq(q->queue_lock);
		elevator_exit(q->elevator);
	}

	blk_exit_rl(&q->root_rl);

	if (q->queue_tags)
		__blk_queue_free_tags(q);

	if (!q->mq_ops)
		blk_free_flush_queue(q->fq);
	else
		blk_mq_release(q);

	blk_trace_shutdown(q);

	if (q->bio_split)
		bioset_free(q->bio_split);

	ida_simple_remove(&blk_queue_ida, q->id);
	call_rcu(&q->rcu_head, blk_free_queue_rcu);
}

static const struct sysfs_ops queue_sysfs_ops = {
	.show = queue_attr_show,
	.store = queue_attr_store,
};

struct kobj_type blk_queue_ktype = {
	.sysfs_ops = &queue_sysfs_ops,
	.default_attrs = default_attrs,
	.release = blk_release_queue,
};
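
/*
 * blk_register_queue() is typically called from add_disk(); it creates
 * the "queue" directory under the disk's sysfs device node and registers
 * the elevator and blk-mq sub-objects beneath it.
 */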

int blk_register_queue(struct gendisk *disk)
{
	int ret;
	struct device *dev = disk_to_dev(disk);
	struct request_queue *q = disk->queue;

	if (WARN_ON(!q))
		return -ENXIO;

	/*
	 * SCSI probing may synchronously create and destroy a lot of
	 * request_queues for non-existent devices.  Shutting down a fully
	 * functional queue takes measurable wallclock time as RCU grace
	 * periods are involved.  To avoid excessive latency in these
	 * cases, a request_queue starts out in a degraded mode which is
	 * faster to shut down and is made fully functional here as
	 * request_queues for non-existent devices never get registered.
	 */
	if (!blk_queue_init_done(q)) {
		queue_flag_set_unlocked(QUEUE_FLAG_INIT_DONE, q);
		percpu_ref_switch_to_percpu(&q->q_usage_counter);
		blk_queue_bypass_end(q);
	}

	ret = blk_trace_init_sysfs(dev);
	if (ret)
		return ret;

	ret = kobject_add(&q->kobj, kobject_get(&dev->kobj), "%s", "queue");
	if (ret < 0) {
		blk_trace_remove_sysfs(dev);
		return ret;
	}

	kobject_uevent(&q->kobj, KOBJ_ADD);

	if (q->mq_ops)
		blk_mq_register_disk(disk);

	if (!q->request_fn)
		return 0;

	ret = elv_register_queue(q);
	if (ret) {
		kobject_uevent(&q->kobj, KOBJ_REMOVE);
		kobject_del(&q->kobj);
		blk_trace_remove_sysfs(dev);
		kobject_put(&dev->kobj);
		return ret;
	}

	return 0;
}
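
/*
 * blk_unregister_queue() undoes blk_register_queue() in reverse order:
 * the blk-mq sysfs objects, the elevator entries, and finally the
 * "queue" kobject itself.
 */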

void blk_unregister_queue(struct gendisk *disk)
{
	struct request_queue *q = disk->queue;

	if (WARN_ON(!q))
		return;

	if (q->mq_ops)
		blk_mq_unregister_disk(disk);

	if (q->request_fn)
		elv_unregister_queue(q);

	kobject_uevent(&q->kobj, KOBJ_REMOVE);
	kobject_del(&q->kobj);
	blk_trace_remove_sysfs(disk_to_dev(disk));
	kobject_put(&disk_to_dev(disk)->kobj);
}