xref: /openbmc/linux/block/blk-sysfs.c (revision add48ba4)
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Functions related to sysfs handling
4  */
5 #include <linux/kernel.h>
6 #include <linux/slab.h>
7 #include <linux/module.h>
8 #include <linux/bio.h>
9 #include <linux/blkdev.h>
10 #include <linux/backing-dev.h>
11 #include <linux/blktrace_api.h>
12 #include <linux/blk-mq.h>
13 #include <linux/blk-cgroup.h>
14 
15 #include "blk.h"
16 #include "blk-mq.h"
17 #include "blk-mq-debugfs.h"
18 #include "blk-wbt.h"
19 
/*
 * One request-queue sysfs attribute: the generic attribute plus the
 * handlers that queue_attr_show()/queue_attr_store() dispatch to.
 */
struct queue_sysfs_entry {
	/* generic sysfs attribute (name and mode) */
	struct attribute attr;
	/* read handler; queue_attr_show() returns -EIO when this is NULL */
	ssize_t (*show)(struct request_queue *, char *);
	/* write handler; queue_attr_store() returns -EIO when this is NULL */
	ssize_t (*store)(struct request_queue *, const char *, size_t);
};
25 
/*
 * Format @var into @page as an unsigned decimal followed by a newline.
 * Returns the number of characters written.
 */
static ssize_t
queue_var_show(unsigned long var, char *page)
{
	ssize_t len = sprintf(page, "%lu\n", var);

	return len;
}
31 
32 static ssize_t
33 queue_var_store(unsigned long *var, const char *page, size_t count)
34 {
35 	int err;
36 	unsigned long v;
37 
38 	err = kstrtoul(page, 10, &v);
39 	if (err || v > UINT_MAX)
40 		return -EINVAL;
41 
42 	*var = v;
43 
44 	return count;
45 }
46 
47 static ssize_t queue_var_store64(s64 *var, const char *page)
48 {
49 	int err;
50 	s64 v;
51 
52 	err = kstrtos64(page, 10, &v);
53 	if (err < 0)
54 		return err;
55 
56 	*var = v;
57 	return 0;
58 }
59 
60 static ssize_t queue_requests_show(struct request_queue *q, char *page)
61 {
62 	return queue_var_show(q->nr_requests, (page));
63 }
64 
65 static ssize_t
66 queue_requests_store(struct request_queue *q, const char *page, size_t count)
67 {
68 	unsigned long nr;
69 	int ret, err;
70 
71 	if (!queue_is_mq(q))
72 		return -EINVAL;
73 
74 	ret = queue_var_store(&nr, page, count);
75 	if (ret < 0)
76 		return ret;
77 
78 	if (nr < BLKDEV_MIN_RQ)
79 		nr = BLKDEV_MIN_RQ;
80 
81 	err = blk_mq_update_nr_requests(q, nr);
82 	if (err)
83 		return err;
84 
85 	return ret;
86 }
87 
88 static ssize_t queue_ra_show(struct request_queue *q, char *page)
89 {
90 	unsigned long ra_kb = q->backing_dev_info->ra_pages <<
91 					(PAGE_SHIFT - 10);
92 
93 	return queue_var_show(ra_kb, (page));
94 }
95 
96 static ssize_t
97 queue_ra_store(struct request_queue *q, const char *page, size_t count)
98 {
99 	unsigned long ra_kb;
100 	ssize_t ret = queue_var_store(&ra_kb, page, count);
101 
102 	if (ret < 0)
103 		return ret;
104 
105 	q->backing_dev_info->ra_pages = ra_kb >> (PAGE_SHIFT - 10);
106 
107 	return ret;
108 }
109 
110 static ssize_t queue_max_sectors_show(struct request_queue *q, char *page)
111 {
112 	int max_sectors_kb = queue_max_sectors(q) >> 1;
113 
114 	return queue_var_show(max_sectors_kb, (page));
115 }
116 
117 static ssize_t queue_max_segments_show(struct request_queue *q, char *page)
118 {
119 	return queue_var_show(queue_max_segments(q), (page));
120 }
121 
122 static ssize_t queue_max_discard_segments_show(struct request_queue *q,
123 		char *page)
124 {
125 	return queue_var_show(queue_max_discard_segments(q), (page));
126 }
127 
128 static ssize_t queue_max_integrity_segments_show(struct request_queue *q, char *page)
129 {
130 	return queue_var_show(q->limits.max_integrity_segments, (page));
131 }
132 
133 static ssize_t queue_max_segment_size_show(struct request_queue *q, char *page)
134 {
135 	return queue_var_show(queue_max_segment_size(q), (page));
136 }
137 
138 static ssize_t queue_logical_block_size_show(struct request_queue *q, char *page)
139 {
140 	return queue_var_show(queue_logical_block_size(q), page);
141 }
142 
143 static ssize_t queue_physical_block_size_show(struct request_queue *q, char *page)
144 {
145 	return queue_var_show(queue_physical_block_size(q), page);
146 }
147 
148 static ssize_t queue_chunk_sectors_show(struct request_queue *q, char *page)
149 {
150 	return queue_var_show(q->limits.chunk_sectors, page);
151 }
152 
153 static ssize_t queue_io_min_show(struct request_queue *q, char *page)
154 {
155 	return queue_var_show(queue_io_min(q), page);
156 }
157 
158 static ssize_t queue_io_opt_show(struct request_queue *q, char *page)
159 {
160 	return queue_var_show(queue_io_opt(q), page);
161 }
162 
163 static ssize_t queue_discard_granularity_show(struct request_queue *q, char *page)
164 {
165 	return queue_var_show(q->limits.discard_granularity, page);
166 }
167 
168 static ssize_t queue_discard_max_hw_show(struct request_queue *q, char *page)
169 {
170 
171 	return sprintf(page, "%llu\n",
172 		(unsigned long long)q->limits.max_hw_discard_sectors << 9);
173 }
174 
175 static ssize_t queue_discard_max_show(struct request_queue *q, char *page)
176 {
177 	return sprintf(page, "%llu\n",
178 		       (unsigned long long)q->limits.max_discard_sectors << 9);
179 }
180 
181 static ssize_t queue_discard_max_store(struct request_queue *q,
182 				       const char *page, size_t count)
183 {
184 	unsigned long max_discard;
185 	ssize_t ret = queue_var_store(&max_discard, page, count);
186 
187 	if (ret < 0)
188 		return ret;
189 
190 	if (max_discard & (q->limits.discard_granularity - 1))
191 		return -EINVAL;
192 
193 	max_discard >>= 9;
194 	if (max_discard > UINT_MAX)
195 		return -EINVAL;
196 
197 	if (max_discard > q->limits.max_hw_discard_sectors)
198 		max_discard = q->limits.max_hw_discard_sectors;
199 
200 	q->limits.max_discard_sectors = max_discard;
201 	return ret;
202 }
203 
204 static ssize_t queue_discard_zeroes_data_show(struct request_queue *q, char *page)
205 {
206 	return queue_var_show(0, page);
207 }
208 
209 static ssize_t queue_write_same_max_show(struct request_queue *q, char *page)
210 {
211 	return sprintf(page, "%llu\n",
212 		(unsigned long long)q->limits.max_write_same_sectors << 9);
213 }
214 
215 static ssize_t queue_write_zeroes_max_show(struct request_queue *q, char *page)
216 {
217 	return sprintf(page, "%llu\n",
218 		(unsigned long long)q->limits.max_write_zeroes_sectors << 9);
219 }
220 
221 static ssize_t queue_zone_append_max_show(struct request_queue *q, char *page)
222 {
223 	unsigned long long max_sectors = q->limits.max_zone_append_sectors;
224 
225 	return sprintf(page, "%llu\n", max_sectors << SECTOR_SHIFT);
226 }
227 
228 static ssize_t
229 queue_max_sectors_store(struct request_queue *q, const char *page, size_t count)
230 {
231 	unsigned long max_sectors_kb,
232 		max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1,
233 			page_kb = 1 << (PAGE_SHIFT - 10);
234 	ssize_t ret = queue_var_store(&max_sectors_kb, page, count);
235 
236 	if (ret < 0)
237 		return ret;
238 
239 	max_hw_sectors_kb = min_not_zero(max_hw_sectors_kb, (unsigned long)
240 					 q->limits.max_dev_sectors >> 1);
241 
242 	if (max_sectors_kb > max_hw_sectors_kb || max_sectors_kb < page_kb)
243 		return -EINVAL;
244 
245 	spin_lock_irq(&q->queue_lock);
246 	q->limits.max_sectors = max_sectors_kb << 1;
247 	q->backing_dev_info->io_pages = max_sectors_kb >> (PAGE_SHIFT - 10);
248 	spin_unlock_irq(&q->queue_lock);
249 
250 	return ret;
251 }
252 
253 static ssize_t queue_max_hw_sectors_show(struct request_queue *q, char *page)
254 {
255 	int max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1;
256 
257 	return queue_var_show(max_hw_sectors_kb, (page));
258 }
259 
/*
 * Generate a queue_show_<name>()/queue_store_<name>() pair for the single
 * queue flag QUEUE_FLAG_<flag>.
 *
 * The show function prints the flag bit; the store function parses a
 * number with queue_var_store() and sets the flag for any non-zero value,
 * clearing it for zero. When @neg is non-zero both directions are
 * inverted, i.e. the attribute exposes the logical negation of the flag.
 */
#define QUEUE_SYSFS_BIT_FNS(name, flag, neg)				\
static ssize_t								\
queue_show_##name(struct request_queue *q, char *page)			\
{									\
	int bit;							\
	bit = test_bit(QUEUE_FLAG_##flag, &q->queue_flags);		\
	return queue_var_show(neg ? !bit : bit, page);			\
}									\
static ssize_t								\
queue_store_##name(struct request_queue *q, const char *page, size_t count) \
{									\
	unsigned long val;						\
	ssize_t ret;							\
	ret = queue_var_store(&val, page, count);			\
	if (ret < 0)							\
		 return ret;						\
	if (neg)							\
		val = !val;						\
									\
	if (val)							\
		blk_queue_flag_set(QUEUE_FLAG_##flag, q);		\
	else								\
		blk_queue_flag_clear(QUEUE_FLAG_##flag, q);		\
	return ret;							\
}

/* nonrot is the only inverted instance (neg == 1). */
QUEUE_SYSFS_BIT_FNS(nonrot, NONROT, 1);
QUEUE_SYSFS_BIT_FNS(random, ADD_RANDOM, 0);
QUEUE_SYSFS_BIT_FNS(iostats, IO_STAT, 0);
#undef QUEUE_SYSFS_BIT_FNS
290 
291 static ssize_t queue_zoned_show(struct request_queue *q, char *page)
292 {
293 	switch (blk_queue_zoned_model(q)) {
294 	case BLK_ZONED_HA:
295 		return sprintf(page, "host-aware\n");
296 	case BLK_ZONED_HM:
297 		return sprintf(page, "host-managed\n");
298 	default:
299 		return sprintf(page, "none\n");
300 	}
301 }
302 
303 static ssize_t queue_nr_zones_show(struct request_queue *q, char *page)
304 {
305 	return queue_var_show(blk_queue_nr_zones(q), page);
306 }
307 
308 static ssize_t queue_nomerges_show(struct request_queue *q, char *page)
309 {
310 	return queue_var_show((blk_queue_nomerges(q) << 1) |
311 			       blk_queue_noxmerges(q), page);
312 }
313 
314 static ssize_t queue_nomerges_store(struct request_queue *q, const char *page,
315 				    size_t count)
316 {
317 	unsigned long nm;
318 	ssize_t ret = queue_var_store(&nm, page, count);
319 
320 	if (ret < 0)
321 		return ret;
322 
323 	blk_queue_flag_clear(QUEUE_FLAG_NOMERGES, q);
324 	blk_queue_flag_clear(QUEUE_FLAG_NOXMERGES, q);
325 	if (nm == 2)
326 		blk_queue_flag_set(QUEUE_FLAG_NOMERGES, q);
327 	else if (nm)
328 		blk_queue_flag_set(QUEUE_FLAG_NOXMERGES, q);
329 
330 	return ret;
331 }
332 
333 static ssize_t queue_rq_affinity_show(struct request_queue *q, char *page)
334 {
335 	bool set = test_bit(QUEUE_FLAG_SAME_COMP, &q->queue_flags);
336 	bool force = test_bit(QUEUE_FLAG_SAME_FORCE, &q->queue_flags);
337 
338 	return queue_var_show(set << force, page);
339 }
340 
341 static ssize_t
342 queue_rq_affinity_store(struct request_queue *q, const char *page, size_t count)
343 {
344 	ssize_t ret = -EINVAL;
345 #ifdef CONFIG_SMP
346 	unsigned long val;
347 
348 	ret = queue_var_store(&val, page, count);
349 	if (ret < 0)
350 		return ret;
351 
352 	if (val == 2) {
353 		blk_queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
354 		blk_queue_flag_set(QUEUE_FLAG_SAME_FORCE, q);
355 	} else if (val == 1) {
356 		blk_queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
357 		blk_queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
358 	} else if (val == 0) {
359 		blk_queue_flag_clear(QUEUE_FLAG_SAME_COMP, q);
360 		blk_queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
361 	}
362 #endif
363 	return ret;
364 }
365 
366 static ssize_t queue_poll_delay_show(struct request_queue *q, char *page)
367 {
368 	int val;
369 
370 	if (q->poll_nsec == BLK_MQ_POLL_CLASSIC)
371 		val = BLK_MQ_POLL_CLASSIC;
372 	else
373 		val = q->poll_nsec / 1000;
374 
375 	return sprintf(page, "%d\n", val);
376 }
377 
378 static ssize_t queue_poll_delay_store(struct request_queue *q, const char *page,
379 				size_t count)
380 {
381 	int err, val;
382 
383 	if (!q->mq_ops || !q->mq_ops->poll)
384 		return -EINVAL;
385 
386 	err = kstrtoint(page, 10, &val);
387 	if (err < 0)
388 		return err;
389 
390 	if (val == BLK_MQ_POLL_CLASSIC)
391 		q->poll_nsec = BLK_MQ_POLL_CLASSIC;
392 	else if (val >= 0)
393 		q->poll_nsec = val * 1000;
394 	else
395 		return -EINVAL;
396 
397 	return count;
398 }
399 
400 static ssize_t queue_poll_show(struct request_queue *q, char *page)
401 {
402 	return queue_var_show(test_bit(QUEUE_FLAG_POLL, &q->queue_flags), page);
403 }
404 
405 static ssize_t queue_poll_store(struct request_queue *q, const char *page,
406 				size_t count)
407 {
408 	unsigned long poll_on;
409 	ssize_t ret;
410 
411 	if (!q->tag_set || q->tag_set->nr_maps <= HCTX_TYPE_POLL ||
412 	    !q->tag_set->map[HCTX_TYPE_POLL].nr_queues)
413 		return -EINVAL;
414 
415 	ret = queue_var_store(&poll_on, page, count);
416 	if (ret < 0)
417 		return ret;
418 
419 	if (poll_on)
420 		blk_queue_flag_set(QUEUE_FLAG_POLL, q);
421 	else
422 		blk_queue_flag_clear(QUEUE_FLAG_POLL, q);
423 
424 	return ret;
425 }
426 
427 static ssize_t queue_io_timeout_show(struct request_queue *q, char *page)
428 {
429 	return sprintf(page, "%u\n", jiffies_to_msecs(q->rq_timeout));
430 }
431 
432 static ssize_t queue_io_timeout_store(struct request_queue *q, const char *page,
433 				  size_t count)
434 {
435 	unsigned int val;
436 	int err;
437 
438 	err = kstrtou32(page, 10, &val);
439 	if (err || val == 0)
440 		return -EINVAL;
441 
442 	blk_queue_rq_timeout(q, msecs_to_jiffies(val));
443 
444 	return count;
445 }
446 
447 static ssize_t queue_wb_lat_show(struct request_queue *q, char *page)
448 {
449 	if (!wbt_rq_qos(q))
450 		return -EINVAL;
451 
452 	return sprintf(page, "%llu\n", div_u64(wbt_get_min_lat(q), 1000));
453 }
454 
455 static ssize_t queue_wb_lat_store(struct request_queue *q, const char *page,
456 				  size_t count)
457 {
458 	struct rq_qos *rqos;
459 	ssize_t ret;
460 	s64 val;
461 
462 	ret = queue_var_store64(&val, page);
463 	if (ret < 0)
464 		return ret;
465 	if (val < -1)
466 		return -EINVAL;
467 
468 	rqos = wbt_rq_qos(q);
469 	if (!rqos) {
470 		ret = wbt_init(q);
471 		if (ret)
472 			return ret;
473 	}
474 
475 	if (val == -1)
476 		val = wbt_default_latency_nsec(q);
477 	else if (val >= 0)
478 		val *= 1000ULL;
479 
480 	if (wbt_get_min_lat(q) == val)
481 		return count;
482 
483 	/*
484 	 * Ensure that the queue is idled, in case the latency update
485 	 * ends up either enabling or disabling wbt completely. We can't
486 	 * have IO inflight if that happens.
487 	 */
488 	blk_mq_freeze_queue(q);
489 	blk_mq_quiesce_queue(q);
490 
491 	wbt_set_min_lat(q, val);
492 
493 	blk_mq_unquiesce_queue(q);
494 	blk_mq_unfreeze_queue(q);
495 
496 	return count;
497 }
498 
499 static ssize_t queue_wc_show(struct request_queue *q, char *page)
500 {
501 	if (test_bit(QUEUE_FLAG_WC, &q->queue_flags))
502 		return sprintf(page, "write back\n");
503 
504 	return sprintf(page, "write through\n");
505 }
506 
507 static ssize_t queue_wc_store(struct request_queue *q, const char *page,
508 			      size_t count)
509 {
510 	int set = -1;
511 
512 	if (!strncmp(page, "write back", 10))
513 		set = 1;
514 	else if (!strncmp(page, "write through", 13) ||
515 		 !strncmp(page, "none", 4))
516 		set = 0;
517 
518 	if (set == -1)
519 		return -EINVAL;
520 
521 	if (set)
522 		blk_queue_flag_set(QUEUE_FLAG_WC, q);
523 	else
524 		blk_queue_flag_clear(QUEUE_FLAG_WC, q);
525 
526 	return count;
527 }
528 
529 static ssize_t queue_fua_show(struct request_queue *q, char *page)
530 {
531 	return sprintf(page, "%u\n", test_bit(QUEUE_FLAG_FUA, &q->queue_flags));
532 }
533 
534 static ssize_t queue_dax_show(struct request_queue *q, char *page)
535 {
536 	return queue_var_show(blk_queue_dax(q), page);
537 }
538 
/*
 * Attribute definitions. Each entry binds a sysfs file name and mode to
 * its handlers: 0644 entries provide both .show and .store, 0444 entries
 * provide .show only.
 */
static struct queue_sysfs_entry queue_requests_entry = {
	.attr = {.name = "nr_requests", .mode = 0644 },
	.show = queue_requests_show,
	.store = queue_requests_store,
};

static struct queue_sysfs_entry queue_ra_entry = {
	.attr = {.name = "read_ahead_kb", .mode = 0644 },
	.show = queue_ra_show,
	.store = queue_ra_store,
};

static struct queue_sysfs_entry queue_max_sectors_entry = {
	.attr = {.name = "max_sectors_kb", .mode = 0644 },
	.show = queue_max_sectors_show,
	.store = queue_max_sectors_store,
};

static struct queue_sysfs_entry queue_max_hw_sectors_entry = {
	.attr = {.name = "max_hw_sectors_kb", .mode = 0444 },
	.show = queue_max_hw_sectors_show,
};

static struct queue_sysfs_entry queue_max_segments_entry = {
	.attr = {.name = "max_segments", .mode = 0444 },
	.show = queue_max_segments_show,
};

static struct queue_sysfs_entry queue_max_discard_segments_entry = {
	.attr = {.name = "max_discard_segments", .mode = 0444 },
	.show = queue_max_discard_segments_show,
};

static struct queue_sysfs_entry queue_max_integrity_segments_entry = {
	.attr = {.name = "max_integrity_segments", .mode = 0444 },
	.show = queue_max_integrity_segments_show,
};

static struct queue_sysfs_entry queue_max_segment_size_entry = {
	.attr = {.name = "max_segment_size", .mode = 0444 },
	.show = queue_max_segment_size_show,
};

static struct queue_sysfs_entry queue_iosched_entry = {
	.attr = {.name = "scheduler", .mode = 0644 },
	.show = elv_iosched_show,
	.store = elv_iosched_store,
};

/* "hw_sector_size" shares its show handler with "logical_block_size". */
static struct queue_sysfs_entry queue_hw_sector_size_entry = {
	.attr = {.name = "hw_sector_size", .mode = 0444 },
	.show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_logical_block_size_entry = {
	.attr = {.name = "logical_block_size", .mode = 0444 },
	.show = queue_logical_block_size_show,
};

static struct queue_sysfs_entry queue_physical_block_size_entry = {
	.attr = {.name = "physical_block_size", .mode = 0444 },
	.show = queue_physical_block_size_show,
};

static struct queue_sysfs_entry queue_chunk_sectors_entry = {
	.attr = {.name = "chunk_sectors", .mode = 0444 },
	.show = queue_chunk_sectors_show,
};

static struct queue_sysfs_entry queue_io_min_entry = {
	.attr = {.name = "minimum_io_size", .mode = 0444 },
	.show = queue_io_min_show,
};

static struct queue_sysfs_entry queue_io_opt_entry = {
	.attr = {.name = "optimal_io_size", .mode = 0444 },
	.show = queue_io_opt_show,
};

static struct queue_sysfs_entry queue_discard_granularity_entry = {
	.attr = {.name = "discard_granularity", .mode = 0444 },
	.show = queue_discard_granularity_show,
};

static struct queue_sysfs_entry queue_discard_max_hw_entry = {
	.attr = {.name = "discard_max_hw_bytes", .mode = 0444 },
	.show = queue_discard_max_hw_show,
};

static struct queue_sysfs_entry queue_discard_max_entry = {
	.attr = {.name = "discard_max_bytes", .mode = 0644 },
	.show = queue_discard_max_show,
	.store = queue_discard_max_store,
};

static struct queue_sysfs_entry queue_discard_zeroes_data_entry = {
	.attr = {.name = "discard_zeroes_data", .mode = 0444 },
	.show = queue_discard_zeroes_data_show,
};

static struct queue_sysfs_entry queue_write_same_max_entry = {
	.attr = {.name = "write_same_max_bytes", .mode = 0444 },
	.show = queue_write_same_max_show,
};

static struct queue_sysfs_entry queue_write_zeroes_max_entry = {
	.attr = {.name = "write_zeroes_max_bytes", .mode = 0444 },
	.show = queue_write_zeroes_max_show,
};

static struct queue_sysfs_entry queue_zone_append_max_entry = {
	.attr = {.name = "zone_append_max_bytes", .mode = 0444 },
	.show = queue_zone_append_max_show,
};

/* Exposed as "rotational": the nonrot handlers invert QUEUE_FLAG_NONROT. */
static struct queue_sysfs_entry queue_nonrot_entry = {
	.attr = {.name = "rotational", .mode = 0644 },
	.show = queue_show_nonrot,
	.store = queue_store_nonrot,
};

static struct queue_sysfs_entry queue_zoned_entry = {
	.attr = {.name = "zoned", .mode = 0444 },
	.show = queue_zoned_show,
};

static struct queue_sysfs_entry queue_nr_zones_entry = {
	.attr = {.name = "nr_zones", .mode = 0444 },
	.show = queue_nr_zones_show,
};

static struct queue_sysfs_entry queue_nomerges_entry = {
	.attr = {.name = "nomerges", .mode = 0644 },
	.show = queue_nomerges_show,
	.store = queue_nomerges_store,
};

static struct queue_sysfs_entry queue_rq_affinity_entry = {
	.attr = {.name = "rq_affinity", .mode = 0644 },
	.show = queue_rq_affinity_show,
	.store = queue_rq_affinity_store,
};

static struct queue_sysfs_entry queue_iostats_entry = {
	.attr = {.name = "iostats", .mode = 0644 },
	.show = queue_show_iostats,
	.store = queue_store_iostats,
};

static struct queue_sysfs_entry queue_random_entry = {
	.attr = {.name = "add_random", .mode = 0644 },
	.show = queue_show_random,
	.store = queue_store_random,
};

static struct queue_sysfs_entry queue_poll_entry = {
	.attr = {.name = "io_poll", .mode = 0644 },
	.show = queue_poll_show,
	.store = queue_poll_store,
};

static struct queue_sysfs_entry queue_poll_delay_entry = {
	.attr = {.name = "io_poll_delay", .mode = 0644 },
	.show = queue_poll_delay_show,
	.store = queue_poll_delay_store,
};

static struct queue_sysfs_entry queue_wc_entry = {
	.attr = {.name = "write_cache", .mode = 0644 },
	.show = queue_wc_show,
	.store = queue_wc_store,
};

static struct queue_sysfs_entry queue_fua_entry = {
	.attr = {.name = "fua", .mode = 0444 },
	.show = queue_fua_show,
};

static struct queue_sysfs_entry queue_dax_entry = {
	.attr = {.name = "dax", .mode = 0444 },
	.show = queue_dax_show,
};

/* Hidden by queue_attr_visible() for queues without a ->timeout operation. */
static struct queue_sysfs_entry queue_io_timeout_entry = {
	.attr = {.name = "io_timeout", .mode = 0644 },
	.show = queue_io_timeout_show,
	.store = queue_io_timeout_store,
};

static struct queue_sysfs_entry queue_wb_lat_entry = {
	.attr = {.name = "wbt_lat_usec", .mode = 0644 },
	.show = queue_wb_lat_show,
	.store = queue_wb_lat_store,
};

#ifdef CONFIG_BLK_DEV_THROTTLING_LOW
static struct queue_sysfs_entry throtl_sample_time_entry = {
	.attr = {.name = "throttle_sample_time", .mode = 0644 },
	.show = blk_throtl_sample_time_show,
	.store = blk_throtl_sample_time_store,
};
#endif
741 
/*
 * NULL-terminated list of the attributes published through
 * queue_attr_group. The throttle sample time attribute is only present
 * with CONFIG_BLK_DEV_THROTTLING_LOW.
 */
static struct attribute *queue_attrs[] = {
	&queue_requests_entry.attr,
	&queue_ra_entry.attr,
	&queue_max_hw_sectors_entry.attr,
	&queue_max_sectors_entry.attr,
	&queue_max_segments_entry.attr,
	&queue_max_discard_segments_entry.attr,
	&queue_max_integrity_segments_entry.attr,
	&queue_max_segment_size_entry.attr,
	&queue_iosched_entry.attr,
	&queue_hw_sector_size_entry.attr,
	&queue_logical_block_size_entry.attr,
	&queue_physical_block_size_entry.attr,
	&queue_chunk_sectors_entry.attr,
	&queue_io_min_entry.attr,
	&queue_io_opt_entry.attr,
	&queue_discard_granularity_entry.attr,
	&queue_discard_max_entry.attr,
	&queue_discard_max_hw_entry.attr,
	&queue_discard_zeroes_data_entry.attr,
	&queue_write_same_max_entry.attr,
	&queue_write_zeroes_max_entry.attr,
	&queue_zone_append_max_entry.attr,
	&queue_nonrot_entry.attr,
	&queue_zoned_entry.attr,
	&queue_nr_zones_entry.attr,
	&queue_nomerges_entry.attr,
	&queue_rq_affinity_entry.attr,
	&queue_iostats_entry.attr,
	&queue_random_entry.attr,
	&queue_poll_entry.attr,
	&queue_wc_entry.attr,
	&queue_fua_entry.attr,
	&queue_dax_entry.attr,
	&queue_wb_lat_entry.attr,
	&queue_poll_delay_entry.attr,
	&queue_io_timeout_entry.attr,
#ifdef CONFIG_BLK_DEV_THROTTLING_LOW
	&throtl_sample_time_entry.attr,
#endif
	NULL,
};
784 
785 static umode_t queue_attr_visible(struct kobject *kobj, struct attribute *attr,
786 				int n)
787 {
788 	struct request_queue *q =
789 		container_of(kobj, struct request_queue, kobj);
790 
791 	if (attr == &queue_io_timeout_entry.attr &&
792 		(!q->mq_ops || !q->mq_ops->timeout))
793 			return 0;
794 
795 	return attr->mode;
796 }
797 
/* Attribute group created on the queue kobject by blk_register_queue(). */
static struct attribute_group queue_attr_group = {
	.attrs = queue_attrs,
	.is_visible = queue_attr_visible,
};
802 
803 
/* Map an embedded struct attribute back to its struct queue_sysfs_entry. */
#define to_queue(atr) container_of((atr), struct queue_sysfs_entry, attr)
805 
806 static ssize_t
807 queue_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
808 {
809 	struct queue_sysfs_entry *entry = to_queue(attr);
810 	struct request_queue *q =
811 		container_of(kobj, struct request_queue, kobj);
812 	ssize_t res;
813 
814 	if (!entry->show)
815 		return -EIO;
816 	mutex_lock(&q->sysfs_lock);
817 	res = entry->show(q, page);
818 	mutex_unlock(&q->sysfs_lock);
819 	return res;
820 }
821 
822 static ssize_t
823 queue_attr_store(struct kobject *kobj, struct attribute *attr,
824 		    const char *page, size_t length)
825 {
826 	struct queue_sysfs_entry *entry = to_queue(attr);
827 	struct request_queue *q;
828 	ssize_t res;
829 
830 	if (!entry->store)
831 		return -EIO;
832 
833 	q = container_of(kobj, struct request_queue, kobj);
834 	mutex_lock(&q->sysfs_lock);
835 	res = entry->store(q, page, length);
836 	mutex_unlock(&q->sysfs_lock);
837 	return res;
838 }
839 
840 static void blk_free_queue_rcu(struct rcu_head *rcu_head)
841 {
842 	struct request_queue *q = container_of(rcu_head, struct request_queue,
843 					       rcu_head);
844 	kmem_cache_free(blk_requestq_cachep, q);
845 }
846 
/*
 * Unconfigure the I/O scheduler and dissociate from the cgroup controller.
 *
 * The three steps are order dependent: the elevator (if any) is torn down
 * first, then the blkcg association is removed, and only then is the
 * reference on q->backing_dev_info dropped.
 */
static void blk_exit_queue(struct request_queue *q)
{
	/*
	 * Since the I/O scheduler exit code may access cgroup information,
	 * perform I/O scheduler exit before disassociating from the block
	 * cgroup controller.
	 */
	if (q->elevator) {
		ioc_clear_queue(q);
		__elevator_exit(q, q->elevator);
		q->elevator = NULL;
	}

	/*
	 * Remove all references to @q from the block cgroup controller before
	 * restoring @q->queue_lock to avoid that restoring this pointer causes
	 * e.g. blkcg_print_blkgs() to crash.
	 */
	blkcg_exit_queue(q);

	/*
	 * Since the cgroup code may dereference the @q->backing_dev_info
	 * pointer, only decrease its reference count after having removed the
	 * association with the block cgroup controller.
	 */
	bdi_put(q->backing_dev_info);
}
875 
876 
/**
 * __blk_release_queue - release a request queue
 * @work: pointer to the release_work member of the request queue to be released
 *
 * Description:
 *     This function is called when a block device is being unregistered. The
 *     process of releasing a request queue starts with blk_cleanup_queue, which
 *     sets the appropriate flags and then calls blk_put_queue, which decrements
 *     the reference counter of the request queue. Once the reference counter
 *     of the request queue reaches zero, blk_release_queue is called to release
 *     all allocated resources of the request queue.
 *
 *     Runs from the work item scheduled by blk_release_queue().
 */
static void __blk_release_queue(struct work_struct *work)
{
	struct request_queue *q = container_of(work, typeof(*q), release_work);

	/* Unhook the poll statistics callback if it was installed, then free it. */
	if (test_bit(QUEUE_FLAG_POLL_STATS, &q->queue_flags))
		blk_stat_remove_callback(q, q->poll_cb);
	blk_stat_free_callback(q->poll_cb);

	blk_free_queue_stats(q->stats);

	if (queue_is_mq(q))
		cancel_delayed_work_sync(&q->requeue_work);

	blk_exit_queue(q);

	blk_queue_free_zone_bitmaps(q);

	if (queue_is_mq(q))
		blk_mq_release(q);

	blk_trace_shutdown(q);

	if (queue_is_mq(q))
		blk_mq_debugfs_unregister(q);

	bioset_exit(&q->bio_split);

	ida_simple_remove(&blk_queue_ida, q->id);
	/* The queue memory itself is freed by blk_free_queue_rcu() via call_rcu(). */
	call_rcu(&q->rcu_head, blk_free_queue_rcu);
}
919 
/*
 * kobject ->release callback for the queue kobject (see blk_queue_ktype).
 * The actual teardown is deferred to __blk_release_queue(), which is run
 * from a work item rather than directly in the caller's context.
 */
static void blk_release_queue(struct kobject *kobj)
{
	struct request_queue *q =
		container_of(kobj, struct request_queue, kobj);

	INIT_WORK(&q->release_work, __blk_release_queue);
	schedule_work(&q->release_work);
}
928 
/* sysfs read/write entry points shared by all queue attributes. */
static const struct sysfs_ops queue_sysfs_ops = {
	.show	= queue_attr_show,
	.store	= queue_attr_store,
};
933 
/*
 * kobject type of the request queue kobject: attribute I/O goes through
 * queue_sysfs_ops and the final put ends up in blk_release_queue().
 */
struct kobj_type blk_queue_ktype = {
	.sysfs_ops	= &queue_sysfs_ops,
	.release	= blk_release_queue,
};
938 
939 /**
940  * blk_register_queue - register a block layer queue with sysfs
941  * @disk: Disk of which the request queue should be registered with sysfs.
942  */
943 int blk_register_queue(struct gendisk *disk)
944 {
945 	int ret;
946 	struct device *dev = disk_to_dev(disk);
947 	struct request_queue *q = disk->queue;
948 	bool has_elevator = false;
949 
950 	if (WARN_ON(!q))
951 		return -ENXIO;
952 
953 	WARN_ONCE(blk_queue_registered(q),
954 		  "%s is registering an already registered queue\n",
955 		  kobject_name(&dev->kobj));
956 
957 	/*
958 	 * SCSI probing may synchronously create and destroy a lot of
959 	 * request_queues for non-existent devices.  Shutting down a fully
960 	 * functional queue takes measureable wallclock time as RCU grace
961 	 * periods are involved.  To avoid excessive latency in these
962 	 * cases, a request_queue starts out in a degraded mode which is
963 	 * faster to shut down and is made fully functional here as
964 	 * request_queues for non-existent devices never get registered.
965 	 */
966 	if (!blk_queue_init_done(q)) {
967 		blk_queue_flag_set(QUEUE_FLAG_INIT_DONE, q);
968 		percpu_ref_switch_to_percpu(&q->q_usage_counter);
969 	}
970 
971 	ret = blk_trace_init_sysfs(dev);
972 	if (ret)
973 		return ret;
974 
975 	mutex_lock(&q->sysfs_dir_lock);
976 
977 	ret = kobject_add(&q->kobj, kobject_get(&dev->kobj), "%s", "queue");
978 	if (ret < 0) {
979 		blk_trace_remove_sysfs(dev);
980 		goto unlock;
981 	}
982 
983 	ret = sysfs_create_group(&q->kobj, &queue_attr_group);
984 	if (ret) {
985 		blk_trace_remove_sysfs(dev);
986 		kobject_del(&q->kobj);
987 		kobject_put(&dev->kobj);
988 		goto unlock;
989 	}
990 
991 	if (queue_is_mq(q)) {
992 		__blk_mq_register_dev(dev, q);
993 		blk_mq_debugfs_register(q);
994 	}
995 
996 	mutex_lock(&q->sysfs_lock);
997 	if (q->elevator) {
998 		ret = elv_register_queue(q, false);
999 		if (ret) {
1000 			mutex_unlock(&q->sysfs_lock);
1001 			mutex_unlock(&q->sysfs_dir_lock);
1002 			kobject_del(&q->kobj);
1003 			blk_trace_remove_sysfs(dev);
1004 			kobject_put(&dev->kobj);
1005 			return ret;
1006 		}
1007 		has_elevator = true;
1008 	}
1009 
1010 	blk_queue_flag_set(QUEUE_FLAG_REGISTERED, q);
1011 	wbt_enable_default(q);
1012 	blk_throtl_register_queue(q);
1013 
1014 	/* Now everything is ready and send out KOBJ_ADD uevent */
1015 	kobject_uevent(&q->kobj, KOBJ_ADD);
1016 	if (has_elevator)
1017 		kobject_uevent(&q->elevator->kobj, KOBJ_ADD);
1018 	mutex_unlock(&q->sysfs_lock);
1019 
1020 	ret = 0;
1021 unlock:
1022 	mutex_unlock(&q->sysfs_dir_lock);
1023 	return ret;
1024 }
1025 EXPORT_SYMBOL_GPL(blk_register_queue);
1026 
/**
 * blk_unregister_queue - counterpart of blk_register_queue()
 * @disk: Disk of which the request queue should be unregistered from sysfs.
 *
 * Does nothing if @disk has no queue (with a warning) or if the queue is
 * not marked QUEUE_FLAG_REGISTERED.
 *
 * Note: the caller is responsible for guaranteeing that this function is called
 * after blk_register_queue() has finished.
 */
void blk_unregister_queue(struct gendisk *disk)
{
	struct request_queue *q = disk->queue;

	if (WARN_ON(!q))
		return;

	/* Return early if disk->queue was never registered. */
	if (!blk_queue_registered(q))
		return;

	/*
	 * Since sysfs_remove_dir() prevents adding new directory entries
	 * before removal of existing entries starts, protect against
	 * concurrent elv_iosched_store() calls.
	 */
	mutex_lock(&q->sysfs_lock);
	blk_queue_flag_clear(QUEUE_FLAG_REGISTERED, q);
	mutex_unlock(&q->sysfs_lock);

	mutex_lock(&q->sysfs_dir_lock);
	/*
	 * Remove the sysfs attributes before unregistering the queue data
	 * structures that can be modified through sysfs.
	 */
	if (queue_is_mq(q))
		blk_mq_unregister_dev(disk_to_dev(disk), q);

	kobject_uevent(&q->kobj, KOBJ_REMOVE);
	kobject_del(&q->kobj);
	blk_trace_remove_sysfs(disk_to_dev(disk));

	mutex_lock(&q->sysfs_lock);
	if (q->elevator)
		elv_unregister_queue(q);
	mutex_unlock(&q->sysfs_lock);
	mutex_unlock(&q->sysfs_dir_lock);

	/* Pairs with the kobject_get() on the disk device in blk_register_queue(). */
	kobject_put(&disk_to_dev(disk)->kobj);
}
1074