/*
 * Functions related to sysfs handling
 */
#include <linux/kernel.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/blkdev.h>
#include <linux/blktrace_api.h>
#include <linux/blk-mq.h>

#include "blk.h"
#include "blk-cgroup.h"
#include "blk-mq.h"
struct queue_sysfs_entry {
	struct attribute attr;
	ssize_t (*show)(struct request_queue *, char *);
	ssize_t (*store)(struct request_queue *, const char *, size_t);
};
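/*
 * Helpers shared by the attribute methods below: each value is printed
 * and parsed as a single unsigned long.
 */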
static ssize_t
queue_var_show(unsigned long var, char *page)
{
	return sprintf(page, "%lu\n", var);
}
static ssize_t
queue_var_store(unsigned long *var, const char *page, size_t count)
{
	int err;
	unsigned long v;

	err = kstrtoul(page, 10, &v);
	if (err || v > UINT_MAX)
		return -EINVAL;

	*var = v;

	return count;
}
static ssize_t queue_requests_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->nr_requests, (page));
}
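/*
 * Writing nr_requests resizes the request lists: the congestion thresholds
 * are recomputed and every request list on the queue is re-checked to see
 * whether its sync and async lists should now be marked full.
 */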
static ssize_t
queue_requests_store(struct request_queue *q, const char *page, size_t count)
{
	struct request_list *rl;
	unsigned long nr;
	int ret;

	if (!q->request_fn)
		return -EINVAL;

	ret = queue_var_store(&nr, page, count);
	if (ret < 0)
		return ret;

	if (nr < BLKDEV_MIN_RQ)
		nr = BLKDEV_MIN_RQ;

	spin_lock_irq(q->queue_lock);
	q->nr_requests = nr;
	blk_queue_congestion_threshold(q);

	/* congestion isn't cgroup aware and follows root blkcg for now */
	rl = &q->root_rl;

	if (rl->count[BLK_RW_SYNC] >= queue_congestion_on_threshold(q))
		blk_set_queue_congested(q, BLK_RW_SYNC);
	else if (rl->count[BLK_RW_SYNC] < queue_congestion_off_threshold(q))
		blk_clear_queue_congested(q, BLK_RW_SYNC);

	if (rl->count[BLK_RW_ASYNC] >= queue_congestion_on_threshold(q))
		blk_set_queue_congested(q, BLK_RW_ASYNC);
	else if (rl->count[BLK_RW_ASYNC] < queue_congestion_off_threshold(q))
		blk_clear_queue_congested(q, BLK_RW_ASYNC);

	blk_queue_for_each_rl(rl, q) {
		if (rl->count[BLK_RW_SYNC] >= q->nr_requests) {
			blk_set_rl_full(rl, BLK_RW_SYNC);
		} else {
			blk_clear_rl_full(rl, BLK_RW_SYNC);
			wake_up(&rl->wait[BLK_RW_SYNC]);
		}

		if (rl->count[BLK_RW_ASYNC] >= q->nr_requests) {
			blk_set_rl_full(rl, BLK_RW_ASYNC);
		} else {
			blk_clear_rl_full(rl, BLK_RW_ASYNC);
			wake_up(&rl->wait[BLK_RW_ASYNC]);
		}
	}

	spin_unlock_irq(q->queue_lock);
	return ret;
}
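/*
 * read_ahead_kb is exposed in kilobytes but stored in backing_dev_info as a
 * number of pages, hence the PAGE_CACHE_SHIFT - 10 conversions below.
 */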
static ssize_t queue_ra_show(struct request_queue *q, char *page)
{
	unsigned long ra_kb = q->backing_dev_info.ra_pages <<
					(PAGE_CACHE_SHIFT - 10);

	return queue_var_show(ra_kb, (page));
}
static ssize_t
queue_ra_store(struct request_queue *q, const char *page, size_t count)
{
	unsigned long ra_kb;
	ssize_t ret = queue_var_store(&ra_kb, page, count);

	if (ret < 0)
		return ret;

	q->backing_dev_info.ra_pages = ra_kb >> (PAGE_CACHE_SHIFT - 10);

	return ret;
}
static ssize_t queue_max_sectors_show(struct request_queue *q, char *page)
{
	int max_sectors_kb = queue_max_sectors(q) >> 1;

	return queue_var_show(max_sectors_kb, (page));
}
static ssize_t queue_max_segments_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_max_segments(q), (page));
}
static ssize_t queue_max_integrity_segments_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->limits.max_integrity_segments, (page));
}
static ssize_t queue_max_segment_size_show(struct request_queue *q, char *page)
{
	if (blk_queue_cluster(q))
		return queue_var_show(queue_max_segment_size(q), (page));

	return queue_var_show(PAGE_CACHE_SIZE, (page));
}
static ssize_t queue_logical_block_size_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_logical_block_size(q), page);
}
static ssize_t queue_physical_block_size_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_physical_block_size(q), page);
}
static ssize_t queue_io_min_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_io_min(q), page);
}
static ssize_t queue_io_opt_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_io_opt(q), page);
}
static ssize_t queue_discard_granularity_show(struct request_queue *q, char *page)
{
	return queue_var_show(q->limits.discard_granularity, page);
}
static ssize_t queue_discard_max_show(struct request_queue *q, char *page)
{
	return sprintf(page, "%llu\n",
		       (unsigned long long)q->limits.max_discard_sectors << 9);
}
static ssize_t queue_discard_zeroes_data_show(struct request_queue *q, char *page)
{
	return queue_var_show(queue_discard_zeroes_data(q), page);
}
static ssize_t queue_write_same_max_show(struct request_queue *q, char *page)
{
	return sprintf(page, "%llu\n",
		       (unsigned long long)q->limits.max_write_same_sectors << 9);
}
static ssize_t
queue_max_sectors_store(struct request_queue *q, const char *page, size_t count)
{
	unsigned long max_sectors_kb,
		max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1,
			page_kb = 1 << (PAGE_CACHE_SHIFT - 10);
	ssize_t ret = queue_var_store(&max_sectors_kb, page, count);

	if (ret < 0)
		return ret;

	if (max_sectors_kb > max_hw_sectors_kb || max_sectors_kb < page_kb)
		return -EINVAL;

	spin_lock_irq(q->queue_lock);
	q->limits.max_sectors = max_sectors_kb << 1;
	spin_unlock_irq(q->queue_lock);

	return ret;
}
static ssize_t queue_max_hw_sectors_show(struct request_queue *q, char *page)
{
	int max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1;

	return queue_var_show(max_hw_sectors_kb, (page));
}
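/*
 * QUEUE_SYSFS_BIT_FNS() generates a show/store pair for a boolean queue
 * flag.  When "neg" is non-zero the exported value is the inverse of the
 * flag, e.g. "rotational" is the negation of QUEUE_FLAG_NONROT.
 */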
#define QUEUE_SYSFS_BIT_FNS(name, flag, neg)				\
static ssize_t								\
queue_show_##name(struct request_queue *q, char *page)			\
{									\
	int bit;							\
	bit = test_bit(QUEUE_FLAG_##flag, &q->queue_flags);		\
	return queue_var_show(neg ? !bit : bit, page);			\
}									\
static ssize_t								\
queue_store_##name(struct request_queue *q, const char *page, size_t count) \
{									\
	unsigned long val;						\
	ssize_t ret;							\
	ret = queue_var_store(&val, page, count);			\
	if (ret < 0)							\
		return ret;						\
	if (neg)							\
		val = !val;						\
									\
	spin_lock_irq(q->queue_lock);					\
	if (val)							\
		queue_flag_set(QUEUE_FLAG_##flag, q);			\
	else								\
		queue_flag_clear(QUEUE_FLAG_##flag, q);			\
	spin_unlock_irq(q->queue_lock);					\
	return ret;							\
}

QUEUE_SYSFS_BIT_FNS(nonrot, NONROT, 1);
QUEUE_SYSFS_BIT_FNS(random, ADD_RANDOM, 0);
QUEUE_SYSFS_BIT_FNS(iostats, IO_STAT, 0);
#undef QUEUE_SYSFS_BIT_FNS
static ssize_t queue_nomerges_show(struct request_queue *q, char *page)
{
	return queue_var_show((blk_queue_nomerges(q) << 1) |
			       blk_queue_noxmerges(q), page);
}
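/*
 * nomerges encodes two flags in one value: 0 enables all merging,
 * 1 sets QUEUE_FLAG_NOXMERGES and 2 sets QUEUE_FLAG_NOMERGES.
 */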
static ssize_t queue_nomerges_store(struct request_queue *q, const char *page,
				    size_t count)
{
	unsigned long nm;
	ssize_t ret = queue_var_store(&nm, page, count);

	if (ret < 0)
		return ret;

	spin_lock_irq(q->queue_lock);
	queue_flag_clear(QUEUE_FLAG_NOMERGES, q);
	queue_flag_clear(QUEUE_FLAG_NOXMERGES, q);
	if (nm == 2)
		queue_flag_set(QUEUE_FLAG_NOMERGES, q);
	else if (nm)
		queue_flag_set(QUEUE_FLAG_NOXMERGES, q);
	spin_unlock_irq(q->queue_lock);

	return ret;
}
static ssize_t queue_rq_affinity_show(struct request_queue *q, char *page)
{
	bool set = test_bit(QUEUE_FLAG_SAME_COMP, &q->queue_flags);
	bool force = test_bit(QUEUE_FLAG_SAME_FORCE, &q->queue_flags);

	return queue_var_show(set << force, page);
}
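/*
 * rq_affinity: 0 clears both flags, 1 sets QUEUE_FLAG_SAME_COMP (complete
 * on the same CPU group as the submitter), 2 additionally sets
 * QUEUE_FLAG_SAME_FORCE to force completion on the submitting CPU itself.
 */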
static ssize_t
queue_rq_affinity_store(struct request_queue *q, const char *page, size_t count)
{
	ssize_t ret = -EINVAL;
#ifdef CONFIG_SMP
	unsigned long val;

	ret = queue_var_store(&val, page, count);
	if (ret < 0)
		return ret;

	spin_lock_irq(q->queue_lock);
	if (val == 2) {
		queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_set(QUEUE_FLAG_SAME_FORCE, q);
	} else if (val == 1) {
		queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
	} else if (val == 0) {
		queue_flag_clear(QUEUE_FLAG_SAME_COMP, q);
		queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
	}
	spin_unlock_irq(q->queue_lock);
#endif
	return ret;
}
static struct queue_sysfs_entry queue_requests_entry = {
	.attr = {.name = "nr_requests", .mode = S_IRUGO | S_IWUSR },
	.show = queue_requests_show,
	.store = queue_requests_store,
};

static struct queue_sysfs_entry queue_ra_entry = {
	.attr = {.name = "read_ahead_kb", .mode = S_IRUGO | S_IWUSR },
	.show = queue_ra_show,
	.store = queue_ra_store,
};

static struct queue_sysfs_entry queue_max_sectors_entry = {
	.attr = {.name = "max_sectors_kb", .mode = S_IRUGO | S_IWUSR },
	.show = queue_max_sectors_show,
	.store = queue_max_sectors_store,
};

static struct queue_sysfs_entry queue_max_hw_sectors_entry = {
	.attr = {.name = "max_hw_sectors_kb", .mode = S_IRUGO },
	.show = queue_max_hw_sectors_show,
};

static struct queue_sysfs_entry queue_max_segments_entry = {
	.attr = {.name = "max_segments", .mode = S_IRUGO },
	.show = queue_max_segments_show,
};

static struct queue_sysfs_entry queue_max_integrity_segments_entry = {
	.attr = {.name = "max_integrity_segments", .mode = S_IRUGO },
	.show = queue_max_integrity_segments_show,
};

static struct queue_sysfs_entry queue_max_segment_size_entry = {
	.attr = {.name = "max_segment_size", .mode = S_IRUGO },
	.show = queue_max_segment_size_show,
};

static struct queue_sysfs_entry queue_iosched_entry = {
	.attr = {.name = "scheduler", .mode = S_IRUGO | S_IWUSR },
	.show = elv_iosched_show,
	.store = elv_iosched_store,
};

static struct queue_sysfs_entry queue_hw_sector_size_entry = {
	.attr = {.name = "hw_sector_size", .mode = S_IRUGO },
	.show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_logical_block_size_entry = {
	.attr = {.name = "logical_block_size", .mode = S_IRUGO },
	.show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_physical_block_size_entry = {
	.attr = {.name = "physical_block_size", .mode = S_IRUGO },
	.show = queue_physical_block_size_show,
};

static struct queue_sysfs_entry queue_io_min_entry = {
	.attr = {.name = "minimum_io_size", .mode = S_IRUGO },
	.show = queue_io_min_show,
};

static struct queue_sysfs_entry queue_io_opt_entry = {
	.attr = {.name = "optimal_io_size", .mode = S_IRUGO },
	.show = queue_io_opt_show,
};

static struct queue_sysfs_entry queue_discard_granularity_entry = {
	.attr = {.name = "discard_granularity", .mode = S_IRUGO },
	.show = queue_discard_granularity_show,
};

static struct queue_sysfs_entry queue_discard_max_entry = {
	.attr = {.name = "discard_max_bytes", .mode = S_IRUGO },
	.show = queue_discard_max_show,
};

static struct queue_sysfs_entry queue_discard_zeroes_data_entry = {
	.attr = {.name = "discard_zeroes_data", .mode = S_IRUGO },
	.show = queue_discard_zeroes_data_show,
};

static struct queue_sysfs_entry queue_write_same_max_entry = {
	.attr = {.name = "write_same_max_bytes", .mode = S_IRUGO },
	.show = queue_write_same_max_show,
};

static struct queue_sysfs_entry queue_nonrot_entry = {
	.attr = {.name = "rotational", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_nonrot,
	.store = queue_store_nonrot,
};

static struct queue_sysfs_entry queue_nomerges_entry = {
	.attr = {.name = "nomerges", .mode = S_IRUGO | S_IWUSR },
	.show = queue_nomerges_show,
	.store = queue_nomerges_store,
};

static struct queue_sysfs_entry queue_rq_affinity_entry = {
	.attr = {.name = "rq_affinity", .mode = S_IRUGO | S_IWUSR },
	.show = queue_rq_affinity_show,
	.store = queue_rq_affinity_store,
};

static struct queue_sysfs_entry queue_iostats_entry = {
	.attr = {.name = "iostats", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_iostats,
	.store = queue_store_iostats,
};

static struct queue_sysfs_entry queue_random_entry = {
	.attr = {.name = "add_random", .mode = S_IRUGO | S_IWUSR },
	.show = queue_show_random,
	.store = queue_store_random,
};
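/* The default attribute set exported under /sys/block/<disk>/queue/. */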
static struct attribute *default_attrs[] = {
	&queue_requests_entry.attr,
	&queue_ra_entry.attr,
	&queue_max_hw_sectors_entry.attr,
	&queue_max_sectors_entry.attr,
	&queue_max_segments_entry.attr,
	&queue_max_integrity_segments_entry.attr,
	&queue_max_segment_size_entry.attr,
	&queue_iosched_entry.attr,
	&queue_hw_sector_size_entry.attr,
	&queue_logical_block_size_entry.attr,
	&queue_physical_block_size_entry.attr,
	&queue_io_min_entry.attr,
	&queue_io_opt_entry.attr,
	&queue_discard_granularity_entry.attr,
	&queue_discard_max_entry.attr,
	&queue_discard_zeroes_data_entry.attr,
	&queue_write_same_max_entry.attr,
	&queue_nonrot_entry.attr,
	&queue_nomerges_entry.attr,
	&queue_rq_affinity_entry.attr,
	&queue_iostats_entry.attr,
	&queue_random_entry.attr,
	NULL,
};
#define to_queue(atr) container_of((atr), struct queue_sysfs_entry, attr)
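/*
 * Generic show/store dispatch: both take q->sysfs_lock and bail out with
 * -ENOENT if the queue is already marked dying.
 */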
static ssize_t
queue_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
{
	struct queue_sysfs_entry *entry = to_queue(attr);
	struct request_queue *q =
		container_of(kobj, struct request_queue, kobj);
	ssize_t res;

	if (!entry->show)
		return -EIO;
	mutex_lock(&q->sysfs_lock);
	if (blk_queue_dying(q)) {
		mutex_unlock(&q->sysfs_lock);
		return -ENOENT;
	}
	res = entry->show(q, page);
	mutex_unlock(&q->sysfs_lock);
	return res;
}
static ssize_t
queue_attr_store(struct kobject *kobj, struct attribute *attr,
		 const char *page, size_t length)
{
	struct queue_sysfs_entry *entry = to_queue(attr);
	struct request_queue *q;
	ssize_t res;

	if (!entry->store)
		return -EIO;

	q = container_of(kobj, struct request_queue, kobj);
	mutex_lock(&q->sysfs_lock);
	if (blk_queue_dying(q)) {
		mutex_unlock(&q->sysfs_lock);
		return -ENOENT;
	}
	res = entry->store(q, page, length);
	mutex_unlock(&q->sysfs_lock);
	return res;
}
static void blk_free_queue_rcu(struct rcu_head *rcu_head)
{
	struct request_queue *q = container_of(rcu_head, struct request_queue,
					       rcu_head);
	kmem_cache_free(blk_requestq_cachep, q);
}
/**
 * blk_release_queue: - release a &struct request_queue when it is no longer needed
 * @kobj:	the kobj belonging to the request queue to be released
 *
 * Description:
 *     blk_release_queue is the pair to blk_init_queue() or
 *     blk_queue_make_request().  It should be called when a request queue is
 *     being released; typically when a block device is being de-registered.
 *     Currently, its primary task is to free all the &struct request
 *     structures that were allocated to the queue and the queue itself.
 *
 * Caveat:
 *     Hopefully the low level driver will have finished any
 *     outstanding requests first...
 **/
static void blk_release_queue(struct kobject *kobj)
{
	struct request_queue *q =
		container_of(kobj, struct request_queue, kobj);

	blk_sync_queue(q);

	blkcg_exit_queue(q);

	if (q->elevator) {
		spin_lock_irq(q->queue_lock);
		ioc_clear_queue(q);
		spin_unlock_irq(q->queue_lock);
		elevator_exit(q->elevator);
	}

	blk_exit_rl(&q->root_rl);

	if (q->queue_tags)
		__blk_queue_free_tags(q);

	percpu_counter_destroy(&q->mq_usage_counter);

	if (q->mq_ops)
		blk_mq_free_queue(q);

	blk_trace_shutdown(q);

	bdi_destroy(&q->backing_dev_info);

	ida_simple_remove(&blk_queue_ida, q->id);
	call_rcu(&q->rcu_head, blk_free_queue_rcu);
}
static const struct sysfs_ops queue_sysfs_ops = {
	.show	= queue_attr_show,
	.store	= queue_attr_store,
};
struct kobj_type blk_queue_ktype = {
	.sysfs_ops	= &queue_sysfs_ops,
	.default_attrs	= default_attrs,
	.release	= blk_release_queue,
};
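/*
 * blk_register_queue() hooks the queue up as a "queue" kobject under the
 * disk's device; blk_unregister_queue() below tears the same hierarchy
 * down again.
 */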
int blk_register_queue(struct gendisk *disk)
{
	int ret;
	struct device *dev = disk_to_dev(disk);
	struct request_queue *q = disk->queue;

	if (WARN_ON(!q))
		return -ENXIO;

	/*
	 * Initialization must be complete by now. Finish the initial
	 * bypass from queue allocation.
	 */
	blk_queue_bypass_end(q);
	queue_flag_set_unlocked(QUEUE_FLAG_INIT_DONE, q);

	ret = blk_trace_init_sysfs(dev);
	if (ret)
		return ret;

	ret = kobject_add(&q->kobj, kobject_get(&dev->kobj), "%s", "queue");
	if (ret < 0) {
		blk_trace_remove_sysfs(dev);
		return ret;
	}

	kobject_uevent(&q->kobj, KOBJ_ADD);

	if (q->mq_ops)
		blk_mq_register_disk(disk);

	if (!q->request_fn)
		return 0;

	ret = elv_register_queue(q);
	if (ret) {
		kobject_uevent(&q->kobj, KOBJ_REMOVE);
		kobject_del(&q->kobj);
		blk_trace_remove_sysfs(dev);
		kobject_put(&dev->kobj);
		return ret;
	}

	return 0;
}
void blk_unregister_queue(struct gendisk *disk)
{
	struct request_queue *q = disk->queue;

	if (WARN_ON(!q))
		return;

	if (q->mq_ops)
		blk_mq_unregister_disk(disk);

	if (q->request_fn)
		elv_unregister_queue(q);

	kobject_uevent(&q->kobj, KOBJ_REMOVE);
	kobject_del(&q->kobj);
	blk_trace_remove_sysfs(disk_to_dev(disk));
	kobject_put(&disk_to_dev(disk)->kobj);
}