/*
 * Functions related to sysfs handling
 */
#include <linux/kernel.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/bio.h>
#include <linux/blkdev.h>
#include <linux/backing-dev.h>
#include <linux/blktrace_api.h>
#include <linux/blk-mq.h>
#include <linux/blk-cgroup.h>

#include "blk.h"
#include "blk-mq.h"

struct queue_sysfs_entry {
	struct attribute attr;
	ssize_t (*show)(struct request_queue *, char *);
	ssize_t (*store)(struct request_queue *, const char *, size_t);
};

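/*
 * Helpers shared by the show/store methods below: each attribute prints a
 * single unsigned long, or parses one, rejecting values that do not fit in
 * an unsigned int.
 */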
static ssize_t
queue_var_show(unsigned long var, char *page)
{
	return sprintf(page, "%lu\n", var);
}

static ssize_t
queue_var_store(unsigned long *var, const char *page, size_t count)
{
	int err;
	unsigned long v;

	err = kstrtoul(page, 10, &v);
	if (err || v > UINT_MAX)
		return -EINVAL;

	*var = v;

	return count;
}

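/*
 * nr_requests: the number of requests that may be allocated before a
 * submitter must wait, adjustable from userspace, e.g.:
 *
 *	echo 128 > /sys/block/<dev>/queue/nr_requests
 */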
static ssize_t queue_requests_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->nr_requests, (page));
}

static ssize_t
queue_requests_store(struct request_queue *q, const char *page, size_t count)
{
	unsigned long nr;
	int ret, err;

	if (!q->request_fn && !q->mq_ops)
		return -EINVAL;

	ret = queue_var_store(&nr, page, count);
	if (ret < 0)
		return ret;

	if (nr < BLKDEV_MIN_RQ)
		nr = BLKDEV_MIN_RQ;

	if (q->request_fn)
		err = blk_update_nr_requests(q, nr);
	else
		err = blk_mq_update_nr_requests(q, nr);

	if (err)
		return err;

	return ret;
}

static ssize_t queue_ra_show(struct request_queue *q, char *page)
{
	unsigned long ra_kb = q->backing_dev_info.ra_pages <<
					(PAGE_SHIFT - 10);

	return queue_var_show(ra_kb, (page));
}

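/*
 * read_ahead_kb is exposed in kilobytes but stored as a page count;
 * shifting by PAGE_SHIFT - 10 converts between the two.
 */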
static ssize_t
queue_ra_store(struct request_queue *q, const char *page, size_t count)
{
	unsigned long ra_kb;
	ssize_t ret = queue_var_store(&ra_kb, page, count);

	if (ret < 0)
		return ret;

	q->backing_dev_info.ra_pages = ra_kb >> (PAGE_SHIFT - 10);

	return ret;
}

static ssize_t queue_max_sectors_show(struct request_queue *q, char *page)
{
	int max_sectors_kb = queue_max_sectors(q) >> 1;

	return queue_var_show(max_sectors_kb, (page));
}

static ssize_t queue_max_segments_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_max_segments(q), (page));
}

static ssize_t queue_max_integrity_segments_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->limits.max_integrity_segments, (page));
}

static ssize_t queue_max_segment_size_show(struct request_queue *q, char *page)
{
	if (blk_queue_cluster(q))
		return queue_var_show(queue_max_segment_size(q), (page));

	return queue_var_show(PAGE_SIZE, (page));
}

static ssize_t queue_logical_block_size_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_logical_block_size(q), page);
}

static ssize_t queue_physical_block_size_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_physical_block_size(q), page);
}

static ssize_t queue_io_min_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_io_min(q), page);
}

static ssize_t queue_io_opt_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_io_opt(q), page);
}

static ssize_t queue_discard_granularity_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->limits.discard_granularity, page);
}

static ssize_t queue_discard_max_hw_show(struct request_queue *q, char *page)
{
	return sprintf(page, "%llu\n",
		(unsigned long long)q->limits.max_hw_discard_sectors << 9);
}

static ssize_t queue_discard_max_show(struct request_queue *q, char *page)
{
	return sprintf(page, "%llu\n",
		(unsigned long long)q->limits.max_discard_sectors << 9);
}

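/*
 * discard_max_bytes is writable: the value must be a multiple of the
 * discard granularity, and is converted from bytes to 512-byte sectors
 * before being capped at the hardware limit.
 */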
static ssize_t queue_discard_max_store(struct request_queue *q,
				       const char *page, size_t count)
{
	unsigned long max_discard;
	ssize_t ret = queue_var_store(&max_discard, page, count);

	if (ret < 0)
		return ret;

	if (max_discard & (q->limits.discard_granularity - 1))
		return -EINVAL;

	max_discard >>= 9;
	if (max_discard > UINT_MAX)
		return -EINVAL;

	if (max_discard > q->limits.max_hw_discard_sectors)
		max_discard = q->limits.max_hw_discard_sectors;

	q->limits.max_discard_sectors = max_discard;
	return ret;
}

static ssize_t queue_discard_zeroes_data_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_discard_zeroes_data(q), page);
}

static ssize_t queue_write_same_max_show(struct request_queue *q, char *page)
{
	return sprintf(page, "%llu\n",
		(unsigned long long)q->limits.max_write_same_sectors << 9);
}

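/*
 * max_sectors_kb must lie between one page and the hardware limit,
 * which is further capped by the device limit when one is set.
 */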
static ssize_t
queue_max_sectors_store(struct request_queue *q, const char *page, size_t count)
{
	unsigned long max_sectors_kb,
		max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1,
			page_kb = 1 << (PAGE_SHIFT - 10);
	ssize_t ret = queue_var_store(&max_sectors_kb, page, count);

	if (ret < 0)
		return ret;

	max_hw_sectors_kb = min_not_zero(max_hw_sectors_kb, (unsigned long)
					 q->limits.max_dev_sectors >> 1);

	if (max_sectors_kb > max_hw_sectors_kb || max_sectors_kb < page_kb)
		return -EINVAL;

	spin_lock_irq(q->queue_lock);
	q->limits.max_sectors = max_sectors_kb << 1;
	q->backing_dev_info.io_pages = max_sectors_kb >> (PAGE_SHIFT - 10);
	spin_unlock_irq(q->queue_lock);

	return ret;
}

static ssize_t queue_max_hw_sectors_show(struct request_queue *q, char *page)
{
	int max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1;

	return queue_var_show(max_hw_sectors_kb, (page));
}

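/*
 * QUEUE_SYSFS_BIT_FNS generates a show/store pair for a single queue flag.
 * "neg" inverts the exposed value, so e.g. the "rotational" attribute
 * reads as 0 when QUEUE_FLAG_NONROT is set.
 */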
#define QUEUE_SYSFS_BIT_FNS(name, flag, neg)				\
static ssize_t								\
queue_show_##name(struct request_queue *q, char *page)			\
{									\
	int bit;							\
	bit = test_bit(QUEUE_FLAG_##flag, &q->queue_flags);		\
	return queue_var_show(neg ? !bit : bit, page);			\
}									\
static ssize_t								\
queue_store_##name(struct request_queue *q, const char *page, size_t count) \
{									\
	unsigned long val;						\
	ssize_t ret;							\
	ret = queue_var_store(&val, page, count);			\
	if (ret < 0)							\
		return ret;						\
	if (neg)							\
		val = !val;						\
									\
	spin_lock_irq(q->queue_lock);					\
	if (val)							\
		queue_flag_set(QUEUE_FLAG_##flag, q);			\
	else								\
		queue_flag_clear(QUEUE_FLAG_##flag, q);			\
	spin_unlock_irq(q->queue_lock);					\
	return ret;							\
}

QUEUE_SYSFS_BIT_FNS(nonrot, NONROT, 1);
QUEUE_SYSFS_BIT_FNS(random, ADD_RANDOM, 0);
QUEUE_SYSFS_BIT_FNS(iostats, IO_STAT, 0);
#undef QUEUE_SYSFS_BIT_FNS

static ssize_t queue_nomerges_show(struct request_queue *q, char *page)
{
	return queue_var_show((blk_queue_nomerges(q) << 1) |
			       blk_queue_noxmerges(q), page);
}

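/*
 * nomerges encodes two flags in one value: 0 enables all merging, 1
 * disables only the more expensive merge lookups (NOXMERGES), and 2
 * disables merging entirely (NOMERGES).
 */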
static ssize_t queue_nomerges_store(struct request_queue *q, const char *page,
				    size_t count)
{
	unsigned long nm;
	ssize_t ret = queue_var_store(&nm, page, count);

	if (ret < 0)
		return ret;

	spin_lock_irq(q->queue_lock);
	queue_flag_clear(QUEUE_FLAG_NOMERGES, q);
	queue_flag_clear(QUEUE_FLAG_NOXMERGES, q);
	if (nm == 2)
		queue_flag_set(QUEUE_FLAG_NOMERGES, q);
	else if (nm)
		queue_flag_set(QUEUE_FLAG_NOXMERGES, q);
	spin_unlock_irq(q->queue_lock);

	return ret;
}

static ssize_t queue_rq_affinity_show(struct request_queue *q, char *page)
{
	bool set = test_bit(QUEUE_FLAG_SAME_COMP, &q->queue_flags);
	bool force = test_bit(QUEUE_FLAG_SAME_FORCE, &q->queue_flags);

	return queue_var_show(set << force, page);
}

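/*
 * rq_affinity: 0 disables completion affinity, 1 completes requests on
 * the submitting CPU's group (SAME_COMP), and 2 forces completion on the
 * exact submitting CPU (SAME_FORCE).
 */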
static ssize_t
queue_rq_affinity_store(struct request_queue *q, const char *page, size_t count)
{
	ssize_t ret = -EINVAL;
#ifdef CONFIG_SMP
	unsigned long val;

	ret = queue_var_store(&val, page, count);
	if (ret < 0)
		return ret;

	spin_lock_irq(q->queue_lock);
	if (val == 2) {
		queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_set(QUEUE_FLAG_SAME_FORCE, q);
	} else if (val == 1) {
		queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
	} else if (val == 0) {
		queue_flag_clear(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
	}
	spin_unlock_irq(q->queue_lock);
#endif
	return ret;
}

static ssize_t queue_poll_show(struct request_queue *q, char *page)
{
	return queue_var_show(test_bit(QUEUE_FLAG_POLL, &q->queue_flags), page);
}

static ssize_t queue_poll_store(struct request_queue *q, const char *page,
				size_t count)
{
	unsigned long poll_on;
	ssize_t ret;

	if (!q->mq_ops || !q->mq_ops->poll)
		return -EINVAL;

	ret = queue_var_store(&poll_on, page, count);
	if (ret < 0)
		return ret;

	spin_lock_irq(q->queue_lock);
	if (poll_on)
		queue_flag_set(QUEUE_FLAG_POLL, q);
	else
		queue_flag_clear(QUEUE_FLAG_POLL, q);
	spin_unlock_irq(q->queue_lock);

	return ret;
}

static ssize_t queue_wc_show(struct request_queue *q, char *page)
{
	if (test_bit(QUEUE_FLAG_WC, &q->queue_flags))
		return sprintf(page, "write back\n");

	return sprintf(page, "write through\n");
}

static ssize_t queue_wc_store(struct request_queue *q, const char *page,
			      size_t count)
{
	int set = -1;

	if (!strncmp(page, "write back", 10))
		set = 1;
	else if (!strncmp(page, "write through", 13) ||
		 !strncmp(page, "none", 4))
		set = 0;

	if (set == -1)
		return -EINVAL;

	spin_lock_irq(q->queue_lock);
	if (set)
		queue_flag_set(QUEUE_FLAG_WC, q);
	else
		queue_flag_clear(QUEUE_FLAG_WC, q);
	spin_unlock_irq(q->queue_lock);

	return count;
}

static ssize_t queue_dax_show(struct request_queue *q, char *page)
{
	return queue_var_show(blk_queue_dax(q), page);
}

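/*
 * The attribute table below maps each file under /sys/block/<dev>/queue/
 * to its show/store handlers.  Read-only attributes use S_IRUGO; writable
 * ones add S_IWUSR.
 */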
static struct queue_sysfs_entry queue_requests_entry = {
	.attr = {.name = "nr_requests", .mode = S_IRUGO | S_IWUSR },
	.show = queue_requests_show,
	.store = queue_requests_store,
};

static struct queue_sysfs_entry queue_ra_entry = {
	.attr = {.name = "read_ahead_kb", .mode = S_IRUGO | S_IWUSR },
	.show = queue_ra_show,
	.store = queue_ra_store,
};

static struct queue_sysfs_entry queue_max_sectors_entry = {
	.attr = {.name = "max_sectors_kb", .mode = S_IRUGO | S_IWUSR },
	.show = queue_max_sectors_show,
	.store = queue_max_sectors_store,
};

static struct queue_sysfs_entry queue_max_hw_sectors_entry = {
	.attr = {.name = "max_hw_sectors_kb", .mode = S_IRUGO },
	.show = queue_max_hw_sectors_show,
};

static struct queue_sysfs_entry queue_max_segments_entry = {
	.attr = {.name = "max_segments", .mode = S_IRUGO },
	.show = queue_max_segments_show,
};

static struct queue_sysfs_entry queue_max_integrity_segments_entry = {
	.attr = {.name = "max_integrity_segments", .mode = S_IRUGO },
	.show = queue_max_integrity_segments_show,
};

static struct queue_sysfs_entry queue_max_segment_size_entry = {
	.attr = {.name = "max_segment_size", .mode = S_IRUGO },
	.show = queue_max_segment_size_show,
};

static struct queue_sysfs_entry queue_iosched_entry = {
	.attr = {.name = "scheduler", .mode = S_IRUGO | S_IWUSR },
	.show = elv_iosched_show,
	.store = elv_iosched_store,
};

static struct queue_sysfs_entry queue_hw_sector_size_entry = {
	.attr = {.name = "hw_sector_size", .mode = S_IRUGO },
	.show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_logical_block_size_entry = {
	.attr = {.name = "logical_block_size", .mode = S_IRUGO },
	.show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_physical_block_size_entry = {
	.attr = {.name = "physical_block_size", .mode = S_IRUGO },
	.show = queue_physical_block_size_show,
};

static struct queue_sysfs_entry queue_io_min_entry = {
	.attr = {.name = "minimum_io_size", .mode = S_IRUGO },
	.show = queue_io_min_show,
};

static struct queue_sysfs_entry queue_io_opt_entry = {
	.attr = {.name = "optimal_io_size", .mode = S_IRUGO },
	.show = queue_io_opt_show,
};

static struct queue_sysfs_entry queue_discard_granularity_entry = {
	.attr = {.name = "discard_granularity", .mode = S_IRUGO },
	.show = queue_discard_granularity_show,
};

static struct queue_sysfs_entry queue_discard_max_hw_entry = {
	.attr = {.name = "discard_max_hw_bytes", .mode = S_IRUGO },
	.show = queue_discard_max_hw_show,
};

static struct queue_sysfs_entry queue_discard_max_entry = {
	.attr = {.name = "discard_max_bytes", .mode = S_IRUGO | S_IWUSR },
	.show = queue_discard_max_show,
	.store = queue_discard_max_store,
};

static struct queue_sysfs_entry queue_discard_zeroes_data_entry = {
	.attr = {.name = "discard_zeroes_data", .mode = S_IRUGO },
	.show = queue_discard_zeroes_data_show,
};

static struct queue_sysfs_entry queue_write_same_max_entry = {
	.attr = {.name = "write_same_max_bytes", .mode = S_IRUGO },
	.show = queue_write_same_max_show,
};

static struct queue_sysfs_entry queue_nonrot_entry = {
	.attr = {.name = "rotational", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_nonrot,
	.store = queue_store_nonrot,
};

static struct queue_sysfs_entry queue_nomerges_entry = {
	.attr = {.name = "nomerges", .mode = S_IRUGO | S_IWUSR },
	.show = queue_nomerges_show,
	.store = queue_nomerges_store,
};

static struct queue_sysfs_entry queue_rq_affinity_entry = {
	.attr = {.name = "rq_affinity", .mode = S_IRUGO | S_IWUSR },
	.show = queue_rq_affinity_show,
	.store = queue_rq_affinity_store,
};

static struct queue_sysfs_entry queue_iostats_entry = {
	.attr = {.name = "iostats", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_iostats,
	.store = queue_store_iostats,
};

static struct queue_sysfs_entry queue_random_entry = {
	.attr = {.name = "add_random", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_random,
	.store = queue_store_random,
};

static struct queue_sysfs_entry queue_poll_entry = {
	.attr = {.name = "io_poll", .mode = S_IRUGO | S_IWUSR },
	.show = queue_poll_show,
	.store = queue_poll_store,
};

static struct queue_sysfs_entry queue_wc_entry = {
	.attr = {.name = "write_cache", .mode = S_IRUGO | S_IWUSR },
	.show = queue_wc_show,
	.store = queue_wc_store,
};

static struct queue_sysfs_entry queue_dax_entry = {
	.attr = {.name = "dax", .mode = S_IRUGO },
	.show = queue_dax_show,
};

static struct attribute *default_attrs[] = {
	&queue_requests_entry.attr,
	&queue_ra_entry.attr,
	&queue_max_hw_sectors_entry.attr,
	&queue_max_sectors_entry.attr,
	&queue_max_segments_entry.attr,
	&queue_max_integrity_segments_entry.attr,
	&queue_max_segment_size_entry.attr,
	&queue_iosched_entry.attr,
	&queue_hw_sector_size_entry.attr,
	&queue_logical_block_size_entry.attr,
	&queue_physical_block_size_entry.attr,
	&queue_io_min_entry.attr,
	&queue_io_opt_entry.attr,
	&queue_discard_granularity_entry.attr,
	&queue_discard_max_entry.attr,
	&queue_discard_max_hw_entry.attr,
	&queue_discard_zeroes_data_entry.attr,
	&queue_write_same_max_entry.attr,
	&queue_nonrot_entry.attr,
	&queue_nomerges_entry.attr,
	&queue_rq_affinity_entry.attr,
	&queue_iostats_entry.attr,
	&queue_random_entry.attr,
	&queue_poll_entry.attr,
	&queue_wc_entry.attr,
	&queue_dax_entry.attr,
	NULL,
};

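/*
 * The generic kobject show/store entry points below recover the
 * queue_sysfs_entry (and the owning request_queue) from the raw attribute
 * via container_of(), then dispatch under sysfs_lock.
 */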
#define to_queue(atr) container_of((atr), struct queue_sysfs_entry, attr)

static ssize_t
queue_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
{
	struct queue_sysfs_entry *entry = to_queue(attr);
	struct request_queue *q =
		container_of(kobj, struct request_queue, kobj);
	ssize_t res;

	if (!entry->show)
		return -EIO;
	mutex_lock(&q->sysfs_lock);
	if (blk_queue_dying(q)) {
		mutex_unlock(&q->sysfs_lock);
		return -ENOENT;
	}
	res = entry->show(q, page);
	mutex_unlock(&q->sysfs_lock);
	return res;
}

static ssize_t
queue_attr_store(struct kobject *kobj, struct attribute *attr,
		 const char *page, size_t length)
{
	struct queue_sysfs_entry *entry = to_queue(attr);
	struct request_queue *q;
	ssize_t res;

	if (!entry->store)
		return -EIO;

	q = container_of(kobj, struct request_queue, kobj);
	mutex_lock(&q->sysfs_lock);
	if (blk_queue_dying(q)) {
		mutex_unlock(&q->sysfs_lock);
		return -ENOENT;
	}
	res = entry->store(q, page, length);
	mutex_unlock(&q->sysfs_lock);
	return res;
}

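/*
 * The queue is freed only after an RCU grace period, so lockless readers
 * still referencing it under rcu_read_lock() cannot see it disappear
 * underneath them.
 */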
static void blk_free_queue_rcu(struct rcu_head *rcu_head)
{
	struct request_queue *q = container_of(rcu_head, struct request_queue,
					       rcu_head);
	kmem_cache_free(blk_requestq_cachep, q);
}

/**
 * blk_release_queue: - release a &struct request_queue when it is no longer needed
 * @kobj:    the kobj belonging to the request queue to be released
 *
 * Description:
 *     blk_release_queue is the pair to blk_init_queue() or
 *     blk_queue_make_request().  It should be called when a request queue is
 *     being released; typically when a block device is being de-registered.
 *     Currently, its primary task is to free all the &struct request
 *     structures that were allocated to the queue and the queue itself.
 *
 * Note:
 *     The low level driver must have finished any outstanding requests first
 *     via blk_cleanup_queue().
 **/
static void blk_release_queue(struct kobject *kobj)
{
	struct request_queue *q =
		container_of(kobj, struct request_queue, kobj);

	bdi_exit(&q->backing_dev_info);
	blkcg_exit_queue(q);

	if (q->elevator) {
		spin_lock_irq(q->queue_lock);
		ioc_clear_queue(q);
		spin_unlock_irq(q->queue_lock);
		elevator_exit(q->elevator);
	}

	blk_exit_rl(&q->root_rl);

	if (q->queue_tags)
		__blk_queue_free_tags(q);

	if (!q->mq_ops)
		blk_free_flush_queue(q->fq);
	else
		blk_mq_release(q);

	blk_trace_shutdown(q);

	if (q->bio_split)
		bioset_free(q->bio_split);

	ida_simple_remove(&blk_queue_ida, q->id);
	call_rcu(&q->rcu_head, blk_free_queue_rcu);
}

static const struct sysfs_ops queue_sysfs_ops = {
	.show	= queue_attr_show,
	.store	= queue_attr_store,
};

struct kobj_type blk_queue_ktype = {
	.sysfs_ops	= &queue_sysfs_ops,
	.default_attrs	= default_attrs,
	.release	= blk_release_queue,
};

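/*
 * blk_register_queue() is normally invoked from add_disk(): it publishes
 * the "queue" directory under the disk's sysfs node and registers the
 * elevator and blk-mq attributes.
 */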
int blk_register_queue(struct gendisk *disk)
{
	int ret;
	struct device *dev = disk_to_dev(disk);
	struct request_queue *q = disk->queue;

	if (WARN_ON(!q))
		return -ENXIO;

	/*
	 * SCSI probing may synchronously create and destroy a lot of
	 * request_queues for non-existent devices.  Shutting down a fully
	 * functional queue takes measurable wallclock time as RCU grace
	 * periods are involved.  To avoid excessive latency in these
	 * cases, a request_queue starts out in a degraded mode which is
	 * faster to shut down and is made fully functional here as
	 * request_queues for non-existent devices never get registered.
	 */
	if (!blk_queue_init_done(q)) {
		queue_flag_set_unlocked(QUEUE_FLAG_INIT_DONE, q);
		percpu_ref_switch_to_percpu(&q->q_usage_counter);
		blk_queue_bypass_end(q);
	}

	ret = blk_trace_init_sysfs(dev);
	if (ret)
		return ret;

	ret = kobject_add(&q->kobj, kobject_get(&dev->kobj), "%s", "queue");
	if (ret < 0) {
		blk_trace_remove_sysfs(dev);
		return ret;
	}

	kobject_uevent(&q->kobj, KOBJ_ADD);

	if (q->mq_ops)
		blk_mq_register_dev(dev, q);

	if (!q->request_fn)
		return 0;

	ret = elv_register_queue(q);
	if (ret) {
		kobject_uevent(&q->kobj, KOBJ_REMOVE);
		kobject_del(&q->kobj);
		blk_trace_remove_sysfs(dev);
		kobject_put(&dev->kobj);
		return ret;
	}

	return 0;
}

void blk_unregister_queue(struct gendisk *disk)
{
	struct request_queue *q = disk->queue;

	if (WARN_ON(!q))
		return;

	if (q->mq_ops)
		blk_mq_unregister_dev(disk_to_dev(disk), q);

	if (q->request_fn)
		elv_unregister_queue(q);

	kobject_uevent(&q->kobj, KOBJ_REMOVE);
	kobject_del(&q->kobj);
	blk_trace_remove_sysfs(disk_to_dev(disk));
	kobject_put(&disk_to_dev(disk)->kobj);
}