/*
 * Functions related to sysfs handling
 */
#include <linux/kernel.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/bio.h>
#include <linux/blkdev.h>
#include <linux/blktrace_api.h>
#include <linux/blk-mq.h>

#include "blk.h"
#include "blk-cgroup.h"
#include "blk-mq.h"

struct queue_sysfs_entry {
        struct attribute attr;
        ssize_t (*show)(struct request_queue *, char *);
        ssize_t (*store)(struct request_queue *, const char *, size_t);
};

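/*
 * Helpers shared by the attribute methods below: queue_var_show() formats an
 * unsigned long for sysfs, queue_var_store() parses one back and rejects
 * values that do not fit in an unsigned int.
 */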
static ssize_t
queue_var_show(unsigned long var, char *page)
{
        return sprintf(page, "%lu\n", var);
}

static ssize_t
queue_var_store(unsigned long *var, const char *page, size_t count)
{
        int err;
        unsigned long v;

        err = kstrtoul(page, 10, &v);
        if (err || v > UINT_MAX)
                return -EINVAL;

        *var = v;

        return count;
}

static ssize_t queue_requests_show(struct request_queue *q, char *page)
{
        return queue_var_show(q->nr_requests, (page));
}

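/*
 * Writing nr_requests resizes the request pool: recompute the congestion
 * thresholds and update the congested/full state of every request_list
 * attached to this queue.
 */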
static ssize_t
queue_requests_store(struct request_queue *q, const char *page, size_t count)
{
        struct request_list *rl;
        unsigned long nr;
        int ret;

        if (!q->request_fn)
                return -EINVAL;

        ret = queue_var_store(&nr, page, count);
        if (ret < 0)
                return ret;

        if (nr < BLKDEV_MIN_RQ)
                nr = BLKDEV_MIN_RQ;

        spin_lock_irq(q->queue_lock);
        q->nr_requests = nr;
        blk_queue_congestion_threshold(q);

        /* congestion isn't cgroup aware and follows root blkcg for now */
        rl = &q->root_rl;

        if (rl->count[BLK_RW_SYNC] >= queue_congestion_on_threshold(q))
                blk_set_queue_congested(q, BLK_RW_SYNC);
        else if (rl->count[BLK_RW_SYNC] < queue_congestion_off_threshold(q))
                blk_clear_queue_congested(q, BLK_RW_SYNC);

        if (rl->count[BLK_RW_ASYNC] >= queue_congestion_on_threshold(q))
                blk_set_queue_congested(q, BLK_RW_ASYNC);
        else if (rl->count[BLK_RW_ASYNC] < queue_congestion_off_threshold(q))
                blk_clear_queue_congested(q, BLK_RW_ASYNC);

        blk_queue_for_each_rl(rl, q) {
                if (rl->count[BLK_RW_SYNC] >= q->nr_requests) {
                        blk_set_rl_full(rl, BLK_RW_SYNC);
                } else {
                        blk_clear_rl_full(rl, BLK_RW_SYNC);
                        wake_up(&rl->wait[BLK_RW_SYNC]);
                }

                if (rl->count[BLK_RW_ASYNC] >= q->nr_requests) {
                        blk_set_rl_full(rl, BLK_RW_ASYNC);
                } else {
                        blk_clear_rl_full(rl, BLK_RW_ASYNC);
                        wake_up(&rl->wait[BLK_RW_ASYNC]);
                }
        }

        spin_unlock_irq(q->queue_lock);
        return ret;
}

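/*
 * read_ahead_kb is kept internally in units of pages; PAGE_CACHE_SHIFT - 10
 * converts between pages and kilobytes.
 */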
static ssize_t queue_ra_show(struct request_queue *q, char *page)
{
        unsigned long ra_kb = q->backing_dev_info.ra_pages <<
                                        (PAGE_CACHE_SHIFT - 10);

        return queue_var_show(ra_kb, (page));
}

static ssize_t
queue_ra_store(struct request_queue *q, const char *page, size_t count)
{
        unsigned long ra_kb;
        ssize_t ret = queue_var_store(&ra_kb, page, count);

        if (ret < 0)
                return ret;

        q->backing_dev_info.ra_pages = ra_kb >> (PAGE_CACHE_SHIFT - 10);

        return ret;
}

static ssize_t queue_max_sectors_show(struct request_queue *q, char *page)
{
        int max_sectors_kb = queue_max_sectors(q) >> 1;

        return queue_var_show(max_sectors_kb, (page));
}

static ssize_t queue_max_segments_show(struct request_queue *q, char *page)
{
        return queue_var_show(queue_max_segments(q), (page));
}

static ssize_t queue_max_integrity_segments_show(struct request_queue *q, char *page)
{
        return queue_var_show(q->limits.max_integrity_segments, (page));
}

static ssize_t queue_max_segment_size_show(struct request_queue *q, char *page)
{
        if (blk_queue_cluster(q))
                return queue_var_show(queue_max_segment_size(q), (page));

        return queue_var_show(PAGE_CACHE_SIZE, (page));
}

static ssize_t queue_logical_block_size_show(struct request_queue *q, char *page)
{
        return queue_var_show(queue_logical_block_size(q), page);
}

static ssize_t queue_physical_block_size_show(struct request_queue *q, char *page)
{
        return queue_var_show(queue_physical_block_size(q), page);
}

static ssize_t queue_io_min_show(struct request_queue *q, char *page)
{
        return queue_var_show(queue_io_min(q), page);
}

static ssize_t queue_io_opt_show(struct request_queue *q, char *page)
{
        return queue_var_show(queue_io_opt(q), page);
}

static ssize_t queue_discard_granularity_show(struct request_queue *q, char *page)
{
        return queue_var_show(q->limits.discard_granularity, page);
}

static ssize_t queue_discard_max_show(struct request_queue *q, char *page)
{
        return sprintf(page, "%llu\n",
                       (unsigned long long)q->limits.max_discard_sectors << 9);
}

static ssize_t queue_discard_zeroes_data_show(struct request_queue *q, char *page)
{
        return queue_var_show(queue_discard_zeroes_data(q), page);
}

static ssize_t queue_write_same_max_show(struct request_queue *q, char *page)
{
        return sprintf(page, "%llu\n",
                       (unsigned long long)q->limits.max_write_same_sectors << 9);
}

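/*
 * max_sectors_kb must lie between one page and max_hw_sectors_kb; the queue
 * limit itself is kept in 512-byte sectors, hence the << 1 / >> 1 conversions.
 */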
static ssize_t
queue_max_sectors_store(struct request_queue *q, const char *page, size_t count)
{
        unsigned long max_sectors_kb,
                max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1,
                        page_kb = 1 << (PAGE_CACHE_SHIFT - 10);
        ssize_t ret = queue_var_store(&max_sectors_kb, page, count);

        if (ret < 0)
                return ret;

        if (max_sectors_kb > max_hw_sectors_kb || max_sectors_kb < page_kb)
                return -EINVAL;

        spin_lock_irq(q->queue_lock);
        q->limits.max_sectors = max_sectors_kb << 1;
        spin_unlock_irq(q->queue_lock);

        return ret;
}

static ssize_t queue_max_hw_sectors_show(struct request_queue *q, char *page)
{
        int max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1;

        return queue_var_show(max_hw_sectors_kb, (page));
}

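/*
 * Generate show/store methods for simple boolean queue flags.  "neg" inverts
 * the value seen by user space, e.g. "rotational" is the negation of
 * QUEUE_FLAG_NONROT.
 */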
#define QUEUE_SYSFS_BIT_FNS(name, flag, neg)                            \
static ssize_t                                                          \
queue_show_##name(struct request_queue *q, char *page)                 \
{                                                                       \
        int bit;                                                        \
        bit = test_bit(QUEUE_FLAG_##flag, &q->queue_flags);             \
        return queue_var_show(neg ? !bit : bit, page);                  \
}                                                                       \
static ssize_t                                                          \
queue_store_##name(struct request_queue *q, const char *page, size_t count) \
{                                                                       \
        unsigned long val;                                              \
        ssize_t ret;                                                    \
        ret = queue_var_store(&val, page, count);                       \
        if (ret < 0)                                                    \
                return ret;                                             \
        if (neg)                                                        \
                val = !val;                                             \
                                                                        \
        spin_lock_irq(q->queue_lock);                                   \
        if (val)                                                        \
                queue_flag_set(QUEUE_FLAG_##flag, q);                   \
        else                                                            \
                queue_flag_clear(QUEUE_FLAG_##flag, q);                 \
        spin_unlock_irq(q->queue_lock);                                 \
        return ret;                                                     \
}

QUEUE_SYSFS_BIT_FNS(nonrot, NONROT, 1);
QUEUE_SYSFS_BIT_FNS(random, ADD_RANDOM, 0);
QUEUE_SYSFS_BIT_FNS(iostats, IO_STAT, 0);
#undef QUEUE_SYSFS_BIT_FNS

static ssize_t queue_nomerges_show(struct request_queue *q, char *page)
{
        return queue_var_show((blk_queue_nomerges(q) << 1) |
                               blk_queue_noxmerges(q), page);
}

static ssize_t queue_nomerges_store(struct request_queue *q, const char *page,
                                    size_t count)
{
        unsigned long nm;
        ssize_t ret = queue_var_store(&nm, page, count);

        if (ret < 0)
                return ret;

        spin_lock_irq(q->queue_lock);
        queue_flag_clear(QUEUE_FLAG_NOMERGES, q);
        queue_flag_clear(QUEUE_FLAG_NOXMERGES, q);
        if (nm == 2)
                queue_flag_set(QUEUE_FLAG_NOMERGES, q);
        else if (nm)
                queue_flag_set(QUEUE_FLAG_NOXMERGES, q);
        spin_unlock_irq(q->queue_lock);

        return ret;
}

static ssize_t queue_rq_affinity_show(struct request_queue *q, char *page)
{
        bool set = test_bit(QUEUE_FLAG_SAME_COMP, &q->queue_flags);
        bool force = test_bit(QUEUE_FLAG_SAME_FORCE, &q->queue_flags);

        return queue_var_show(set << force, page);
}

static ssize_t
queue_rq_affinity_store(struct request_queue *q, const char *page, size_t count)
{
        ssize_t ret = -EINVAL;
#ifdef CONFIG_SMP
        unsigned long val;

        ret = queue_var_store(&val, page, count);
        if (ret < 0)
                return ret;

        spin_lock_irq(q->queue_lock);
        if (val == 2) {
                queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
                queue_flag_set(QUEUE_FLAG_SAME_FORCE, q);
        } else if (val == 1) {
                queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
                queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
        } else if (val == 0) {
                queue_flag_clear(QUEUE_FLAG_SAME_COMP, q);
                queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
        }
        spin_unlock_irq(q->queue_lock);
#endif
        return ret;
}

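/*
 * Attribute table: each entry binds a file name under
 * /sys/block/<dev>/queue/ to the show/store handlers defined above.
 */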
static struct queue_sysfs_entry queue_requests_entry = {
        .attr = {.name = "nr_requests", .mode = S_IRUGO | S_IWUSR },
        .show = queue_requests_show,
        .store = queue_requests_store,
};

static struct queue_sysfs_entry queue_ra_entry = {
        .attr = {.name = "read_ahead_kb", .mode = S_IRUGO | S_IWUSR },
        .show = queue_ra_show,
        .store = queue_ra_store,
};

static struct queue_sysfs_entry queue_max_sectors_entry = {
        .attr = {.name = "max_sectors_kb", .mode = S_IRUGO | S_IWUSR },
        .show = queue_max_sectors_show,
        .store = queue_max_sectors_store,
};

static struct queue_sysfs_entry queue_max_hw_sectors_entry = {
        .attr = {.name = "max_hw_sectors_kb", .mode = S_IRUGO },
        .show = queue_max_hw_sectors_show,
};

static struct queue_sysfs_entry queue_max_segments_entry = {
        .attr = {.name = "max_segments", .mode = S_IRUGO },
        .show = queue_max_segments_show,
};

static struct queue_sysfs_entry queue_max_integrity_segments_entry = {
        .attr = {.name = "max_integrity_segments", .mode = S_IRUGO },
        .show = queue_max_integrity_segments_show,
};

static struct queue_sysfs_entry queue_max_segment_size_entry = {
        .attr = {.name = "max_segment_size", .mode = S_IRUGO },
        .show = queue_max_segment_size_show,
};

static struct queue_sysfs_entry queue_iosched_entry = {
        .attr = {.name = "scheduler", .mode = S_IRUGO | S_IWUSR },
        .show = elv_iosched_show,
        .store = elv_iosched_store,
};

static struct queue_sysfs_entry queue_hw_sector_size_entry = {
        .attr = {.name = "hw_sector_size", .mode = S_IRUGO },
        .show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_logical_block_size_entry = {
        .attr = {.name = "logical_block_size", .mode = S_IRUGO },
        .show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_physical_block_size_entry = {
        .attr = {.name = "physical_block_size", .mode = S_IRUGO },
        .show = queue_physical_block_size_show,
};

static struct queue_sysfs_entry queue_io_min_entry = {
        .attr = {.name = "minimum_io_size", .mode = S_IRUGO },
        .show = queue_io_min_show,
};

static struct queue_sysfs_entry queue_io_opt_entry = {
        .attr = {.name = "optimal_io_size", .mode = S_IRUGO },
        .show = queue_io_opt_show,
};

static struct queue_sysfs_entry queue_discard_granularity_entry = {
        .attr = {.name = "discard_granularity", .mode = S_IRUGO },
        .show = queue_discard_granularity_show,
};

static struct queue_sysfs_entry queue_discard_max_entry = {
        .attr = {.name = "discard_max_bytes", .mode = S_IRUGO },
        .show = queue_discard_max_show,
};

static struct queue_sysfs_entry queue_discard_zeroes_data_entry = {
        .attr = {.name = "discard_zeroes_data", .mode = S_IRUGO },
        .show = queue_discard_zeroes_data_show,
};

static struct queue_sysfs_entry queue_write_same_max_entry = {
        .attr = {.name = "write_same_max_bytes", .mode = S_IRUGO },
        .show = queue_write_same_max_show,
};

static struct queue_sysfs_entry queue_nonrot_entry = {
        .attr = {.name = "rotational", .mode = S_IRUGO | S_IWUSR },
        .show = queue_show_nonrot,
        .store = queue_store_nonrot,
};

static struct queue_sysfs_entry queue_nomerges_entry = {
        .attr = {.name = "nomerges", .mode = S_IRUGO | S_IWUSR },
        .show = queue_nomerges_show,
        .store = queue_nomerges_store,
};

static struct queue_sysfs_entry queue_rq_affinity_entry = {
        .attr = {.name = "rq_affinity", .mode = S_IRUGO | S_IWUSR },
        .show = queue_rq_affinity_show,
        .store = queue_rq_affinity_store,
};

static struct queue_sysfs_entry queue_iostats_entry = {
        .attr = {.name = "iostats", .mode = S_IRUGO | S_IWUSR },
        .show = queue_show_iostats,
        .store = queue_store_iostats,
};

static struct queue_sysfs_entry queue_random_entry = {
        .attr = {.name = "add_random", .mode = S_IRUGO | S_IWUSR },
        .show = queue_show_random,
        .store = queue_store_random,
};

static struct attribute *default_attrs[] = {
        &queue_requests_entry.attr,
        &queue_ra_entry.attr,
        &queue_max_hw_sectors_entry.attr,
        &queue_max_sectors_entry.attr,
        &queue_max_segments_entry.attr,
        &queue_max_integrity_segments_entry.attr,
        &queue_max_segment_size_entry.attr,
        &queue_iosched_entry.attr,
        &queue_hw_sector_size_entry.attr,
        &queue_logical_block_size_entry.attr,
        &queue_physical_block_size_entry.attr,
        &queue_io_min_entry.attr,
        &queue_io_opt_entry.attr,
        &queue_discard_granularity_entry.attr,
        &queue_discard_max_entry.attr,
        &queue_discard_zeroes_data_entry.attr,
        &queue_write_same_max_entry.attr,
        &queue_nonrot_entry.attr,
        &queue_nomerges_entry.attr,
        &queue_rq_affinity_entry.attr,
        &queue_iostats_entry.attr,
        &queue_random_entry.attr,
        NULL,
};

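/*
 * sysfs_ops entry points: dispatch attribute reads and writes to the
 * per-attribute handlers under sysfs_lock, refusing access once the queue
 * is dying.
 */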
#define to_queue(atr) container_of((atr), struct queue_sysfs_entry, attr)

static ssize_t
queue_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
{
        struct queue_sysfs_entry *entry = to_queue(attr);
        struct request_queue *q =
                container_of(kobj, struct request_queue, kobj);
        ssize_t res;

        if (!entry->show)
                return -EIO;
        mutex_lock(&q->sysfs_lock);
        if (blk_queue_dying(q)) {
                mutex_unlock(&q->sysfs_lock);
                return -ENOENT;
        }
        res = entry->show(q, page);
        mutex_unlock(&q->sysfs_lock);
        return res;
}

static ssize_t
queue_attr_store(struct kobject *kobj, struct attribute *attr,
                 const char *page, size_t length)
{
        struct queue_sysfs_entry *entry = to_queue(attr);
        struct request_queue *q;
        ssize_t res;

        if (!entry->store)
                return -EIO;

        q = container_of(kobj, struct request_queue, kobj);
        mutex_lock(&q->sysfs_lock);
        if (blk_queue_dying(q)) {
                mutex_unlock(&q->sysfs_lock);
                return -ENOENT;
        }
        res = entry->store(q, page, length);
        mutex_unlock(&q->sysfs_lock);
        return res;
}

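/*
 * RCU callback that finally frees the request_queue; scheduled from
 * blk_release_queue() via call_rcu().
 */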
static void blk_free_queue_rcu(struct rcu_head *rcu_head)
{
        struct request_queue *q = container_of(rcu_head, struct request_queue,
                                               rcu_head);
        kmem_cache_free(blk_requestq_cachep, q);
}

/**
 * blk_release_queue: - release a &struct request_queue when it is no longer needed
 * @kobj: the kobj belonging to the request queue to be released
 *
 * Description:
 *     blk_release_queue is the pair to blk_init_queue() or
 *     blk_queue_make_request().  It should be called when a request queue is
 *     being released; typically when a block device is being de-registered.
 *     Currently, its primary task is to free all the &struct request
 *     structures that were allocated to the queue and the queue itself.
 *
 * Caveat:
 *     Hopefully the low level driver will have finished any
 *     outstanding requests first...
 **/
static void blk_release_queue(struct kobject *kobj)
{
        struct request_queue *q =
                container_of(kobj, struct request_queue, kobj);

        blk_sync_queue(q);

        blkcg_exit_queue(q);

        if (q->elevator) {
                spin_lock_irq(q->queue_lock);
                ioc_clear_queue(q);
                spin_unlock_irq(q->queue_lock);
                elevator_exit(q->elevator);
        }

        blk_exit_rl(&q->root_rl);

        if (q->queue_tags)
                __blk_queue_free_tags(q);

        percpu_counter_destroy(&q->mq_usage_counter);

        if (q->mq_ops)
                blk_mq_free_queue(q);

        blk_trace_shutdown(q);

        bdi_destroy(&q->backing_dev_info);

        ida_simple_remove(&blk_queue_ida, q->id);
        call_rcu(&q->rcu_head, blk_free_queue_rcu);
}

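/*
 * queue_sysfs_ops and blk_queue_ktype wire the default attributes, the
 * show/store dispatchers and the release handler into the queue kobject.
 */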
static const struct sysfs_ops queue_sysfs_ops = {
        .show   = queue_attr_show,
        .store  = queue_attr_store,
};

struct kobj_type blk_queue_ktype = {
        .sysfs_ops      = &queue_sysfs_ops,
        .default_attrs  = default_attrs,
        .release        = blk_release_queue,
};

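/*
 * Add the "queue" directory for a disk to sysfs and register the blk-mq or
 * elevator attributes that go with it.
 */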
int blk_register_queue(struct gendisk *disk)
{
        int ret;
        struct device *dev = disk_to_dev(disk);
        struct request_queue *q = disk->queue;

        if (WARN_ON(!q))
                return -ENXIO;

        /*
         * Initialization must be complete by now. Finish the initial
         * bypass from queue allocation.
         */
        blk_queue_bypass_end(q);
        queue_flag_set_unlocked(QUEUE_FLAG_INIT_DONE, q);

        ret = blk_trace_init_sysfs(dev);
        if (ret)
                return ret;

        ret = kobject_add(&q->kobj, kobject_get(&dev->kobj), "%s", "queue");
        if (ret < 0) {
                blk_trace_remove_sysfs(dev);
                return ret;
        }

        kobject_uevent(&q->kobj, KOBJ_ADD);

        if (q->mq_ops)
                blk_mq_register_disk(disk);

        if (!q->request_fn)
                return 0;

        ret = elv_register_queue(q);
        if (ret) {
                kobject_uevent(&q->kobj, KOBJ_REMOVE);
                kobject_del(&q->kobj);
                blk_trace_remove_sysfs(dev);
                kobject_put(&dev->kobj);
                return ret;
        }

        return 0;
}

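/* Undo blk_register_queue(): remove the queue directory and drop its references. */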
void blk_unregister_queue(struct gendisk *disk)
{
        struct request_queue *q = disk->queue;

        if (WARN_ON(!q))
                return;

        if (q->mq_ops)
                blk_mq_unregister_disk(disk);

        if (q->request_fn)
                elv_unregister_queue(q);

        kobject_uevent(&q->kobj, KOBJ_REMOVE);
        kobject_del(&q->kobj);
        blk_trace_remove_sysfs(disk_to_dev(disk));
        kobject_put(&disk_to_dev(disk)->kobj);
}