xref: /openbmc/linux/block/blk-sysfs.c (revision 2fa5ebe3)
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Functions related to sysfs handling
4  */
5 #include <linux/kernel.h>
6 #include <linux/slab.h>
7 #include <linux/module.h>
8 #include <linux/bio.h>
9 #include <linux/blkdev.h>
10 #include <linux/backing-dev.h>
11 #include <linux/blktrace_api.h>
12 #include <linux/blk-mq.h>
13 #include <linux/debugfs.h>
14 
15 #include "blk.h"
16 #include "blk-mq.h"
17 #include "blk-mq-debugfs.h"
18 #include "blk-mq-sched.h"
19 #include "blk-rq-qos.h"
20 #include "blk-wbt.h"
21 #include "blk-cgroup.h"
22 #include "blk-throttle.h"
23 
24 struct queue_sysfs_entry {
25 	struct attribute attr;
26 	ssize_t (*show)(struct request_queue *, char *);
27 	ssize_t (*store)(struct request_queue *, const char *, size_t);
28 };
29 
/*
 * Format @var into @page as an unsigned decimal number followed by a
 * newline.  Returns whatever sprintf() returns, i.e. the number of
 * characters written.
 */
static ssize_t queue_var_show(unsigned long var, char *page)
{
	ssize_t len = sprintf(page, "%lu\n", var);

	return len;
}
35 
36 static ssize_t
37 queue_var_store(unsigned long *var, const char *page, size_t count)
38 {
39 	int err;
40 	unsigned long v;
41 
42 	err = kstrtoul(page, 10, &v);
43 	if (err || v > UINT_MAX)
44 		return -EINVAL;
45 
46 	*var = v;
47 
48 	return count;
49 }
50 
51 static ssize_t queue_var_store64(s64 *var, const char *page)
52 {
53 	int err;
54 	s64 v;
55 
56 	err = kstrtos64(page, 10, &v);
57 	if (err < 0)
58 		return err;
59 
60 	*var = v;
61 	return 0;
62 }
63 
64 static ssize_t queue_requests_show(struct request_queue *q, char *page)
65 {
66 	return queue_var_show(q->nr_requests, page);
67 }
68 
69 static ssize_t
70 queue_requests_store(struct request_queue *q, const char *page, size_t count)
71 {
72 	unsigned long nr;
73 	int ret, err;
74 
75 	if (!queue_is_mq(q))
76 		return -EINVAL;
77 
78 	ret = queue_var_store(&nr, page, count);
79 	if (ret < 0)
80 		return ret;
81 
82 	if (nr < BLKDEV_MIN_RQ)
83 		nr = BLKDEV_MIN_RQ;
84 
85 	err = blk_mq_update_nr_requests(q, nr);
86 	if (err)
87 		return err;
88 
89 	return ret;
90 }
91 
92 static ssize_t queue_ra_show(struct request_queue *q, char *page)
93 {
94 	unsigned long ra_kb;
95 
96 	if (!q->disk)
97 		return -EINVAL;
98 	ra_kb = q->disk->bdi->ra_pages << (PAGE_SHIFT - 10);
99 	return queue_var_show(ra_kb, page);
100 }
101 
102 static ssize_t
103 queue_ra_store(struct request_queue *q, const char *page, size_t count)
104 {
105 	unsigned long ra_kb;
106 	ssize_t ret;
107 
108 	if (!q->disk)
109 		return -EINVAL;
110 	ret = queue_var_store(&ra_kb, page, count);
111 	if (ret < 0)
112 		return ret;
113 	q->disk->bdi->ra_pages = ra_kb >> (PAGE_SHIFT - 10);
114 	return ret;
115 }
116 
117 static ssize_t queue_max_sectors_show(struct request_queue *q, char *page)
118 {
119 	int max_sectors_kb = queue_max_sectors(q) >> 1;
120 
121 	return queue_var_show(max_sectors_kb, page);
122 }
123 
124 static ssize_t queue_max_segments_show(struct request_queue *q, char *page)
125 {
126 	return queue_var_show(queue_max_segments(q), page);
127 }
128 
129 static ssize_t queue_max_discard_segments_show(struct request_queue *q,
130 		char *page)
131 {
132 	return queue_var_show(queue_max_discard_segments(q), page);
133 }
134 
135 static ssize_t queue_max_integrity_segments_show(struct request_queue *q, char *page)
136 {
137 	return queue_var_show(q->limits.max_integrity_segments, page);
138 }
139 
140 static ssize_t queue_max_segment_size_show(struct request_queue *q, char *page)
141 {
142 	return queue_var_show(queue_max_segment_size(q), page);
143 }
144 
145 static ssize_t queue_logical_block_size_show(struct request_queue *q, char *page)
146 {
147 	return queue_var_show(queue_logical_block_size(q), page);
148 }
149 
150 static ssize_t queue_physical_block_size_show(struct request_queue *q, char *page)
151 {
152 	return queue_var_show(queue_physical_block_size(q), page);
153 }
154 
155 static ssize_t queue_chunk_sectors_show(struct request_queue *q, char *page)
156 {
157 	return queue_var_show(q->limits.chunk_sectors, page);
158 }
159 
160 static ssize_t queue_io_min_show(struct request_queue *q, char *page)
161 {
162 	return queue_var_show(queue_io_min(q), page);
163 }
164 
165 static ssize_t queue_io_opt_show(struct request_queue *q, char *page)
166 {
167 	return queue_var_show(queue_io_opt(q), page);
168 }
169 
170 static ssize_t queue_discard_granularity_show(struct request_queue *q, char *page)
171 {
172 	return queue_var_show(q->limits.discard_granularity, page);
173 }
174 
175 static ssize_t queue_discard_max_hw_show(struct request_queue *q, char *page)
176 {
177 
178 	return sprintf(page, "%llu\n",
179 		(unsigned long long)q->limits.max_hw_discard_sectors << 9);
180 }
181 
182 static ssize_t queue_discard_max_show(struct request_queue *q, char *page)
183 {
184 	return sprintf(page, "%llu\n",
185 		       (unsigned long long)q->limits.max_discard_sectors << 9);
186 }
187 
188 static ssize_t queue_discard_max_store(struct request_queue *q,
189 				       const char *page, size_t count)
190 {
191 	unsigned long max_discard;
192 	ssize_t ret = queue_var_store(&max_discard, page, count);
193 
194 	if (ret < 0)
195 		return ret;
196 
197 	if (max_discard & (q->limits.discard_granularity - 1))
198 		return -EINVAL;
199 
200 	max_discard >>= 9;
201 	if (max_discard > UINT_MAX)
202 		return -EINVAL;
203 
204 	if (max_discard > q->limits.max_hw_discard_sectors)
205 		max_discard = q->limits.max_hw_discard_sectors;
206 
207 	q->limits.max_discard_sectors = max_discard;
208 	return ret;
209 }
210 
211 static ssize_t queue_discard_zeroes_data_show(struct request_queue *q, char *page)
212 {
213 	return queue_var_show(0, page);
214 }
215 
216 static ssize_t queue_write_same_max_show(struct request_queue *q, char *page)
217 {
218 	return queue_var_show(0, page);
219 }
220 
221 static ssize_t queue_write_zeroes_max_show(struct request_queue *q, char *page)
222 {
223 	return sprintf(page, "%llu\n",
224 		(unsigned long long)q->limits.max_write_zeroes_sectors << 9);
225 }
226 
227 static ssize_t queue_zone_write_granularity_show(struct request_queue *q,
228 						 char *page)
229 {
230 	return queue_var_show(queue_zone_write_granularity(q), page);
231 }
232 
233 static ssize_t queue_zone_append_max_show(struct request_queue *q, char *page)
234 {
235 	unsigned long long max_sectors = q->limits.max_zone_append_sectors;
236 
237 	return sprintf(page, "%llu\n", max_sectors << SECTOR_SHIFT);
238 }
239 
240 static ssize_t
241 queue_max_sectors_store(struct request_queue *q, const char *page, size_t count)
242 {
243 	unsigned long var;
244 	unsigned int max_sectors_kb,
245 		max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1,
246 			page_kb = 1 << (PAGE_SHIFT - 10);
247 	ssize_t ret = queue_var_store(&var, page, count);
248 
249 	if (ret < 0)
250 		return ret;
251 
252 	max_sectors_kb = (unsigned int)var;
253 	max_hw_sectors_kb = min_not_zero(max_hw_sectors_kb,
254 					 q->limits.max_dev_sectors >> 1);
255 	if (max_sectors_kb == 0) {
256 		q->limits.max_user_sectors = 0;
257 		max_sectors_kb = min(max_hw_sectors_kb,
258 				     BLK_DEF_MAX_SECTORS >> 1);
259 	} else {
260 		if (max_sectors_kb > max_hw_sectors_kb ||
261 		    max_sectors_kb < page_kb)
262 			return -EINVAL;
263 		q->limits.max_user_sectors = max_sectors_kb << 1;
264 	}
265 
266 	spin_lock_irq(&q->queue_lock);
267 	q->limits.max_sectors = max_sectors_kb << 1;
268 	if (q->disk)
269 		q->disk->bdi->io_pages = max_sectors_kb >> (PAGE_SHIFT - 10);
270 	spin_unlock_irq(&q->queue_lock);
271 
272 	return ret;
273 }
274 
275 static ssize_t queue_max_hw_sectors_show(struct request_queue *q, char *page)
276 {
277 	int max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1;
278 
279 	return queue_var_show(max_hw_sectors_kb, page);
280 }
281 
282 static ssize_t queue_virt_boundary_mask_show(struct request_queue *q, char *page)
283 {
284 	return queue_var_show(q->limits.virt_boundary_mask, page);
285 }
286 
287 static ssize_t queue_dma_alignment_show(struct request_queue *q, char *page)
288 {
289 	return queue_var_show(queue_dma_alignment(q), page);
290 }
291 
292 #define QUEUE_SYSFS_BIT_FNS(name, flag, neg)				\
293 static ssize_t								\
294 queue_##name##_show(struct request_queue *q, char *page)		\
295 {									\
296 	int bit;							\
297 	bit = test_bit(QUEUE_FLAG_##flag, &q->queue_flags);		\
298 	return queue_var_show(neg ? !bit : bit, page);			\
299 }									\
300 static ssize_t								\
301 queue_##name##_store(struct request_queue *q, const char *page, size_t count) \
302 {									\
303 	unsigned long val;						\
304 	ssize_t ret;							\
305 	ret = queue_var_store(&val, page, count);			\
306 	if (ret < 0)							\
307 		 return ret;						\
308 	if (neg)							\
309 		val = !val;						\
310 									\
311 	if (val)							\
312 		blk_queue_flag_set(QUEUE_FLAG_##flag, q);		\
313 	else								\
314 		blk_queue_flag_clear(QUEUE_FLAG_##flag, q);		\
315 	return ret;							\
316 }
317 
318 QUEUE_SYSFS_BIT_FNS(nonrot, NONROT, 1);
319 QUEUE_SYSFS_BIT_FNS(random, ADD_RANDOM, 0);
320 QUEUE_SYSFS_BIT_FNS(iostats, IO_STAT, 0);
321 QUEUE_SYSFS_BIT_FNS(stable_writes, STABLE_WRITES, 0);
322 #undef QUEUE_SYSFS_BIT_FNS
323 
324 static ssize_t queue_zoned_show(struct request_queue *q, char *page)
325 {
326 	switch (blk_queue_zoned_model(q)) {
327 	case BLK_ZONED_HA:
328 		return sprintf(page, "host-aware\n");
329 	case BLK_ZONED_HM:
330 		return sprintf(page, "host-managed\n");
331 	default:
332 		return sprintf(page, "none\n");
333 	}
334 }
335 
336 static ssize_t queue_nr_zones_show(struct request_queue *q, char *page)
337 {
338 	return queue_var_show(disk_nr_zones(q->disk), page);
339 }
340 
341 static ssize_t queue_max_open_zones_show(struct request_queue *q, char *page)
342 {
343 	return queue_var_show(bdev_max_open_zones(q->disk->part0), page);
344 }
345 
346 static ssize_t queue_max_active_zones_show(struct request_queue *q, char *page)
347 {
348 	return queue_var_show(bdev_max_active_zones(q->disk->part0), page);
349 }
350 
351 static ssize_t queue_nomerges_show(struct request_queue *q, char *page)
352 {
353 	return queue_var_show((blk_queue_nomerges(q) << 1) |
354 			       blk_queue_noxmerges(q), page);
355 }
356 
357 static ssize_t queue_nomerges_store(struct request_queue *q, const char *page,
358 				    size_t count)
359 {
360 	unsigned long nm;
361 	ssize_t ret = queue_var_store(&nm, page, count);
362 
363 	if (ret < 0)
364 		return ret;
365 
366 	blk_queue_flag_clear(QUEUE_FLAG_NOMERGES, q);
367 	blk_queue_flag_clear(QUEUE_FLAG_NOXMERGES, q);
368 	if (nm == 2)
369 		blk_queue_flag_set(QUEUE_FLAG_NOMERGES, q);
370 	else if (nm)
371 		blk_queue_flag_set(QUEUE_FLAG_NOXMERGES, q);
372 
373 	return ret;
374 }
375 
376 static ssize_t queue_rq_affinity_show(struct request_queue *q, char *page)
377 {
378 	bool set = test_bit(QUEUE_FLAG_SAME_COMP, &q->queue_flags);
379 	bool force = test_bit(QUEUE_FLAG_SAME_FORCE, &q->queue_flags);
380 
381 	return queue_var_show(set << force, page);
382 }
383 
384 static ssize_t
385 queue_rq_affinity_store(struct request_queue *q, const char *page, size_t count)
386 {
387 	ssize_t ret = -EINVAL;
388 #ifdef CONFIG_SMP
389 	unsigned long val;
390 
391 	ret = queue_var_store(&val, page, count);
392 	if (ret < 0)
393 		return ret;
394 
395 	if (val == 2) {
396 		blk_queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
397 		blk_queue_flag_set(QUEUE_FLAG_SAME_FORCE, q);
398 	} else if (val == 1) {
399 		blk_queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
400 		blk_queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
401 	} else if (val == 0) {
402 		blk_queue_flag_clear(QUEUE_FLAG_SAME_COMP, q);
403 		blk_queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
404 	}
405 #endif
406 	return ret;
407 }
408 
409 static ssize_t queue_poll_delay_show(struct request_queue *q, char *page)
410 {
411 	int val;
412 
413 	if (q->poll_nsec == BLK_MQ_POLL_CLASSIC)
414 		val = BLK_MQ_POLL_CLASSIC;
415 	else
416 		val = q->poll_nsec / 1000;
417 
418 	return sprintf(page, "%d\n", val);
419 }
420 
421 static ssize_t queue_poll_delay_store(struct request_queue *q, const char *page,
422 				size_t count)
423 {
424 	int err, val;
425 
426 	if (!q->mq_ops || !q->mq_ops->poll)
427 		return -EINVAL;
428 
429 	err = kstrtoint(page, 10, &val);
430 	if (err < 0)
431 		return err;
432 
433 	if (val == BLK_MQ_POLL_CLASSIC)
434 		q->poll_nsec = BLK_MQ_POLL_CLASSIC;
435 	else if (val >= 0)
436 		q->poll_nsec = val * 1000;
437 	else
438 		return -EINVAL;
439 
440 	return count;
441 }
442 
443 static ssize_t queue_poll_show(struct request_queue *q, char *page)
444 {
445 	return queue_var_show(test_bit(QUEUE_FLAG_POLL, &q->queue_flags), page);
446 }
447 
448 static ssize_t queue_poll_store(struct request_queue *q, const char *page,
449 				size_t count)
450 {
451 	if (!test_bit(QUEUE_FLAG_POLL, &q->queue_flags))
452 		return -EINVAL;
453 	pr_info_ratelimited("writes to the poll attribute are ignored.\n");
454 	pr_info_ratelimited("please use driver specific parameters instead.\n");
455 	return count;
456 }
457 
458 static ssize_t queue_io_timeout_show(struct request_queue *q, char *page)
459 {
460 	return sprintf(page, "%u\n", jiffies_to_msecs(q->rq_timeout));
461 }
462 
463 static ssize_t queue_io_timeout_store(struct request_queue *q, const char *page,
464 				  size_t count)
465 {
466 	unsigned int val;
467 	int err;
468 
469 	err = kstrtou32(page, 10, &val);
470 	if (err || val == 0)
471 		return -EINVAL;
472 
473 	blk_queue_rq_timeout(q, msecs_to_jiffies(val));
474 
475 	return count;
476 }
477 
478 static ssize_t queue_wb_lat_show(struct request_queue *q, char *page)
479 {
480 	if (!wbt_rq_qos(q))
481 		return -EINVAL;
482 
483 	if (wbt_disabled(q))
484 		return sprintf(page, "0\n");
485 
486 	return sprintf(page, "%llu\n", div_u64(wbt_get_min_lat(q), 1000));
487 }
488 
489 static ssize_t queue_wb_lat_store(struct request_queue *q, const char *page,
490 				  size_t count)
491 {
492 	struct rq_qos *rqos;
493 	ssize_t ret;
494 	s64 val;
495 
496 	ret = queue_var_store64(&val, page);
497 	if (ret < 0)
498 		return ret;
499 	if (val < -1)
500 		return -EINVAL;
501 
502 	rqos = wbt_rq_qos(q);
503 	if (!rqos) {
504 		ret = wbt_init(q->disk);
505 		if (ret)
506 			return ret;
507 	}
508 
509 	if (val == -1)
510 		val = wbt_default_latency_nsec(q);
511 	else if (val >= 0)
512 		val *= 1000ULL;
513 
514 	if (wbt_get_min_lat(q) == val)
515 		return count;
516 
517 	/*
518 	 * Ensure that the queue is idled, in case the latency update
519 	 * ends up either enabling or disabling wbt completely. We can't
520 	 * have IO inflight if that happens.
521 	 */
522 	blk_mq_freeze_queue(q);
523 	blk_mq_quiesce_queue(q);
524 
525 	wbt_set_min_lat(q, val);
526 
527 	blk_mq_unquiesce_queue(q);
528 	blk_mq_unfreeze_queue(q);
529 
530 	return count;
531 }
532 
533 static ssize_t queue_wc_show(struct request_queue *q, char *page)
534 {
535 	if (test_bit(QUEUE_FLAG_WC, &q->queue_flags))
536 		return sprintf(page, "write back\n");
537 
538 	return sprintf(page, "write through\n");
539 }
540 
541 static ssize_t queue_wc_store(struct request_queue *q, const char *page,
542 			      size_t count)
543 {
544 	int set = -1;
545 
546 	if (!strncmp(page, "write back", 10))
547 		set = 1;
548 	else if (!strncmp(page, "write through", 13) ||
549 		 !strncmp(page, "none", 4))
550 		set = 0;
551 
552 	if (set == -1)
553 		return -EINVAL;
554 
555 	if (set)
556 		blk_queue_flag_set(QUEUE_FLAG_WC, q);
557 	else
558 		blk_queue_flag_clear(QUEUE_FLAG_WC, q);
559 
560 	return count;
561 }
562 
563 static ssize_t queue_fua_show(struct request_queue *q, char *page)
564 {
565 	return sprintf(page, "%u\n", test_bit(QUEUE_FLAG_FUA, &q->queue_flags));
566 }
567 
568 static ssize_t queue_dax_show(struct request_queue *q, char *page)
569 {
570 	return queue_var_show(blk_queue_dax(q), page);
571 }
572 
/*
 * Define "static struct queue_sysfs_entry <_prefix>_entry" for the sysfs
 * file @_name with permissions @_mode.  The show callback is always
 * <_prefix>_show; @_store is the store callback or NULL.
 */
#define QUEUE_SYSFS_ENTRY(_prefix, _name, _mode, _store)	\
static struct queue_sysfs_entry _prefix##_entry = {		\
	.attr	= { .name = _name, .mode = _mode },		\
	.show	= _prefix##_show,				\
	.store	= _store,					\
}

/* Read-only (0444) attribute backed by <_prefix>_show only. */
#define QUEUE_RO_ENTRY(_prefix, _name)				\
	QUEUE_SYSFS_ENTRY(_prefix, _name, 0444, NULL);

/* Read-write (0644) attribute backed by <_prefix>_show and <_prefix>_store. */
#define QUEUE_RW_ENTRY(_prefix, _name)				\
	QUEUE_SYSFS_ENTRY(_prefix, _name, 0644, _prefix##_store);
585 
/*
 * Attribute definitions.  Each line creates <prefix>_entry for the sysfs
 * file named by the string; RW entries are writable (0644) and use
 * <prefix>_store, RO entries are read-only (0444).
 */

/* Request count, read-ahead and transfer size limits, IO scheduler. */
QUEUE_RW_ENTRY(queue_requests, "nr_requests");
QUEUE_RW_ENTRY(queue_ra, "read_ahead_kb");
QUEUE_RW_ENTRY(queue_max_sectors, "max_sectors_kb");
QUEUE_RO_ENTRY(queue_max_hw_sectors, "max_hw_sectors_kb");
QUEUE_RO_ENTRY(queue_max_segments, "max_segments");
QUEUE_RO_ENTRY(queue_max_integrity_segments, "max_integrity_segments");
QUEUE_RO_ENTRY(queue_max_segment_size, "max_segment_size");
QUEUE_RW_ENTRY(elv_iosched, "scheduler");

/* Block sizes and IO size hints. */
QUEUE_RO_ENTRY(queue_logical_block_size, "logical_block_size");
QUEUE_RO_ENTRY(queue_physical_block_size, "physical_block_size");
QUEUE_RO_ENTRY(queue_chunk_sectors, "chunk_sectors");
QUEUE_RO_ENTRY(queue_io_min, "minimum_io_size");
QUEUE_RO_ENTRY(queue_io_opt, "optimal_io_size");

/* Discard limits; discard_zeroes_data always reads as 0. */
QUEUE_RO_ENTRY(queue_max_discard_segments, "max_discard_segments");
QUEUE_RO_ENTRY(queue_discard_granularity, "discard_granularity");
QUEUE_RO_ENTRY(queue_discard_max_hw, "discard_max_hw_bytes");
QUEUE_RW_ENTRY(queue_discard_max, "discard_max_bytes");
QUEUE_RO_ENTRY(queue_discard_zeroes_data, "discard_zeroes_data");

/* Write same/zeroes and zone append limits; write_same_max_bytes always reads as 0. */
QUEUE_RO_ENTRY(queue_write_same_max, "write_same_max_bytes");
QUEUE_RO_ENTRY(queue_write_zeroes_max, "write_zeroes_max_bytes");
QUEUE_RO_ENTRY(queue_zone_append_max, "zone_append_max_bytes");
QUEUE_RO_ENTRY(queue_zone_write_granularity, "zone_write_granularity");

/* Zoned device information. */
QUEUE_RO_ENTRY(queue_zoned, "zoned");
QUEUE_RO_ENTRY(queue_nr_zones, "nr_zones");
QUEUE_RO_ENTRY(queue_max_open_zones, "max_open_zones");
QUEUE_RO_ENTRY(queue_max_active_zones, "max_active_zones");

/* Merging, completion affinity, polling, caching, timeouts, throttling. */
QUEUE_RW_ENTRY(queue_nomerges, "nomerges");
QUEUE_RW_ENTRY(queue_rq_affinity, "rq_affinity");
QUEUE_RW_ENTRY(queue_poll, "io_poll");
QUEUE_RW_ENTRY(queue_poll_delay, "io_poll_delay");
QUEUE_RW_ENTRY(queue_wc, "write_cache");
QUEUE_RO_ENTRY(queue_fua, "fua");
QUEUE_RO_ENTRY(queue_dax, "dax");
QUEUE_RW_ENTRY(queue_io_timeout, "io_timeout");
QUEUE_RW_ENTRY(queue_wb_lat, "wbt_lat_usec");
QUEUE_RO_ENTRY(queue_virt_boundary_mask, "virt_boundary_mask");
QUEUE_RO_ENTRY(queue_dma_alignment, "dma_alignment");

/* Only built with CONFIG_BLK_DEV_THROTTLING_LOW; handlers live outside this file. */
#ifdef CONFIG_BLK_DEV_THROTTLING_LOW
QUEUE_RW_ENTRY(blk_throtl_sample_time, "throttle_sample_time");
#endif

/* legacy alias for logical_block_size: */
static struct queue_sysfs_entry queue_hw_sector_size_entry = {
	.attr = {.name = "hw_sector_size", .mode = 0444 },
	.show = queue_logical_block_size_show,
};

/*
 * Single-flag attributes generated by QUEUE_SYSFS_BIT_FNS.  "rotational"
 * is backed by the queue_nonrot_* handlers, i.e. it is the inverse of
 * QUEUE_FLAG_NONROT.
 */
QUEUE_RW_ENTRY(queue_nonrot, "rotational");
QUEUE_RW_ENTRY(queue_iostats, "iostats");
QUEUE_RW_ENTRY(queue_random, "add_random");
QUEUE_RW_ENTRY(queue_stable_writes, "stable_writes");
643 
/*
 * NULL-terminated list of all attributes in the queue attribute group.
 * Per-queue visibility is decided by queue_attr_visible().
 */
static struct attribute *queue_attrs[] = {
	&queue_requests_entry.attr,
	&queue_ra_entry.attr,
	&queue_max_hw_sectors_entry.attr,
	&queue_max_sectors_entry.attr,
	&queue_max_segments_entry.attr,
	&queue_max_discard_segments_entry.attr,
	&queue_max_integrity_segments_entry.attr,
	&queue_max_segment_size_entry.attr,
	&elv_iosched_entry.attr,
	&queue_hw_sector_size_entry.attr,
	&queue_logical_block_size_entry.attr,
	&queue_physical_block_size_entry.attr,
	&queue_chunk_sectors_entry.attr,
	&queue_io_min_entry.attr,
	&queue_io_opt_entry.attr,
	&queue_discard_granularity_entry.attr,
	&queue_discard_max_entry.attr,
	&queue_discard_max_hw_entry.attr,
	&queue_discard_zeroes_data_entry.attr,
	&queue_write_same_max_entry.attr,
	&queue_write_zeroes_max_entry.attr,
	&queue_zone_append_max_entry.attr,
	&queue_zone_write_granularity_entry.attr,
	&queue_nonrot_entry.attr,
	&queue_zoned_entry.attr,
	&queue_nr_zones_entry.attr,
	/* the two zone limits below are hidden on non-zoned queues */
	&queue_max_open_zones_entry.attr,
	&queue_max_active_zones_entry.attr,
	&queue_nomerges_entry.attr,
	&queue_rq_affinity_entry.attr,
	&queue_iostats_entry.attr,
	&queue_stable_writes_entry.attr,
	&queue_random_entry.attr,
	&queue_poll_entry.attr,
	&queue_wc_entry.attr,
	&queue_fua_entry.attr,
	&queue_dax_entry.attr,
	&queue_wb_lat_entry.attr,
	&queue_poll_delay_entry.attr,
	/* hidden unless the queue's mq_ops provide ->timeout */
	&queue_io_timeout_entry.attr,
#ifdef CONFIG_BLK_DEV_THROTTLING_LOW
	&blk_throtl_sample_time_entry.attr,
#endif
	&queue_virt_boundary_mask_entry.attr,
	&queue_dma_alignment_entry.attr,
	NULL,
};
692 
693 static umode_t queue_attr_visible(struct kobject *kobj, struct attribute *attr,
694 				int n)
695 {
696 	struct gendisk *disk = container_of(kobj, struct gendisk, queue_kobj);
697 	struct request_queue *q = disk->queue;
698 
699 	if (attr == &queue_io_timeout_entry.attr &&
700 		(!q->mq_ops || !q->mq_ops->timeout))
701 			return 0;
702 
703 	if ((attr == &queue_max_open_zones_entry.attr ||
704 	     attr == &queue_max_active_zones_entry.attr) &&
705 	    !blk_queue_is_zoned(q))
706 		return 0;
707 
708 	return attr->mode;
709 }
710 
/*
 * The queue attribute group: every attribute in queue_attrs, filtered per
 * queue through queue_attr_visible().
 */
static struct attribute_group queue_attr_group = {
	.attrs = queue_attrs,
	.is_visible = queue_attr_visible,
};
715 
716 
/* Map a struct attribute pointer back to its enclosing queue_sysfs_entry. */
#define to_queue(_attr)	\
	container_of((_attr), struct queue_sysfs_entry, attr)
718 
719 static ssize_t
720 queue_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
721 {
722 	struct queue_sysfs_entry *entry = to_queue(attr);
723 	struct gendisk *disk = container_of(kobj, struct gendisk, queue_kobj);
724 	struct request_queue *q = disk->queue;
725 	ssize_t res;
726 
727 	if (!entry->show)
728 		return -EIO;
729 	mutex_lock(&q->sysfs_lock);
730 	res = entry->show(q, page);
731 	mutex_unlock(&q->sysfs_lock);
732 	return res;
733 }
734 
735 static ssize_t
736 queue_attr_store(struct kobject *kobj, struct attribute *attr,
737 		    const char *page, size_t length)
738 {
739 	struct queue_sysfs_entry *entry = to_queue(attr);
740 	struct gendisk *disk = container_of(kobj, struct gendisk, queue_kobj);
741 	struct request_queue *q = disk->queue;
742 	ssize_t res;
743 
744 	if (!entry->store)
745 		return -EIO;
746 
747 	mutex_lock(&q->sysfs_lock);
748 	res = entry->store(q, page, length);
749 	mutex_unlock(&q->sysfs_lock);
750 	return res;
751 }
752 
/*
 * sysfs operations of the queue kobject: all reads and writes go through
 * the dispatchers above, which forward to the per-attribute callbacks.
 */
static const struct sysfs_ops queue_sysfs_ops = {
	.show	= queue_attr_show,
	.store	= queue_attr_store,
};
757 
/* NULL-terminated list of default attribute groups for the queue kobject. */
static const struct attribute_group *blk_queue_attr_groups[] = {
	&queue_attr_group,
	NULL
};
762 
/* ->release callback of the queue kobject type; intentionally empty. */
static void blk_queue_release(struct kobject *kobj)
{
	/* nothing to do here, all data is associated with the parent gendisk */
}
767 
/*
 * kobject type of disk->queue_kobj: ties together the default attribute
 * groups, the show/store dispatchers and the (empty) release callback.
 */
static const struct kobj_type blk_queue_ktype = {
	.default_groups = blk_queue_attr_groups,
	.sysfs_ops	= &queue_sysfs_ops,
	.release	= blk_queue_release,
};
773 
774 static void blk_debugfs_remove(struct gendisk *disk)
775 {
776 	struct request_queue *q = disk->queue;
777 
778 	mutex_lock(&q->debugfs_mutex);
779 	blk_trace_shutdown(q);
780 	debugfs_remove_recursive(q->debugfs_dir);
781 	q->debugfs_dir = NULL;
782 	q->sched_debugfs_dir = NULL;
783 	q->rqos_debugfs_dir = NULL;
784 	mutex_unlock(&q->debugfs_mutex);
785 }
786 
787 /**
788  * blk_register_queue - register a block layer queue with sysfs
789  * @disk: Disk of which the request queue should be registered with sysfs.
790  */
791 int blk_register_queue(struct gendisk *disk)
792 {
793 	struct request_queue *q = disk->queue;
794 	int ret;
795 
796 	mutex_lock(&q->sysfs_dir_lock);
797 	kobject_init(&disk->queue_kobj, &blk_queue_ktype);
798 	ret = kobject_add(&disk->queue_kobj, &disk_to_dev(disk)->kobj, "queue");
799 	if (ret < 0)
800 		goto out_put_queue_kobj;
801 
802 	if (queue_is_mq(q)) {
803 		ret = blk_mq_sysfs_register(disk);
804 		if (ret)
805 			goto out_put_queue_kobj;
806 	}
807 	mutex_lock(&q->sysfs_lock);
808 
809 	mutex_lock(&q->debugfs_mutex);
810 	q->debugfs_dir = debugfs_create_dir(disk->disk_name, blk_debugfs_root);
811 	if (queue_is_mq(q))
812 		blk_mq_debugfs_register(q);
813 	mutex_unlock(&q->debugfs_mutex);
814 
815 	ret = disk_register_independent_access_ranges(disk);
816 	if (ret)
817 		goto out_debugfs_remove;
818 
819 	if (q->elevator) {
820 		ret = elv_register_queue(q, false);
821 		if (ret)
822 			goto out_unregister_ia_ranges;
823 	}
824 
825 	ret = blk_crypto_sysfs_register(disk);
826 	if (ret)
827 		goto out_elv_unregister;
828 
829 	blk_queue_flag_set(QUEUE_FLAG_REGISTERED, q);
830 	wbt_enable_default(disk);
831 	blk_throtl_register(disk);
832 
833 	/* Now everything is ready and send out KOBJ_ADD uevent */
834 	kobject_uevent(&disk->queue_kobj, KOBJ_ADD);
835 	if (q->elevator)
836 		kobject_uevent(&q->elevator->kobj, KOBJ_ADD);
837 	mutex_unlock(&q->sysfs_lock);
838 	mutex_unlock(&q->sysfs_dir_lock);
839 
840 	/*
841 	 * SCSI probing may synchronously create and destroy a lot of
842 	 * request_queues for non-existent devices.  Shutting down a fully
843 	 * functional queue takes measureable wallclock time as RCU grace
844 	 * periods are involved.  To avoid excessive latency in these
845 	 * cases, a request_queue starts out in a degraded mode which is
846 	 * faster to shut down and is made fully functional here as
847 	 * request_queues for non-existent devices never get registered.
848 	 */
849 	if (!blk_queue_init_done(q)) {
850 		blk_queue_flag_set(QUEUE_FLAG_INIT_DONE, q);
851 		percpu_ref_switch_to_percpu(&q->q_usage_counter);
852 	}
853 
854 	return ret;
855 
856 out_elv_unregister:
857 	elv_unregister_queue(q);
858 out_unregister_ia_ranges:
859 	disk_unregister_independent_access_ranges(disk);
860 out_debugfs_remove:
861 	blk_debugfs_remove(disk);
862 	mutex_unlock(&q->sysfs_lock);
863 out_put_queue_kobj:
864 	kobject_put(&disk->queue_kobj);
865 	mutex_unlock(&q->sysfs_dir_lock);
866 	return ret;
867 }
868 
869 /**
870  * blk_unregister_queue - counterpart of blk_register_queue()
871  * @disk: Disk of which the request queue should be unregistered from sysfs.
872  *
873  * Note: the caller is responsible for guaranteeing that this function is called
874  * after blk_register_queue() has finished.
875  */
876 void blk_unregister_queue(struct gendisk *disk)
877 {
878 	struct request_queue *q = disk->queue;
879 
880 	if (WARN_ON(!q))
881 		return;
882 
883 	/* Return early if disk->queue was never registered. */
884 	if (!blk_queue_registered(q))
885 		return;
886 
887 	/*
888 	 * Since sysfs_remove_dir() prevents adding new directory entries
889 	 * before removal of existing entries starts, protect against
890 	 * concurrent elv_iosched_store() calls.
891 	 */
892 	mutex_lock(&q->sysfs_lock);
893 	blk_queue_flag_clear(QUEUE_FLAG_REGISTERED, q);
894 	mutex_unlock(&q->sysfs_lock);
895 
896 	mutex_lock(&q->sysfs_dir_lock);
897 	/*
898 	 * Remove the sysfs attributes before unregistering the queue data
899 	 * structures that can be modified through sysfs.
900 	 */
901 	if (queue_is_mq(q))
902 		blk_mq_sysfs_unregister(disk);
903 	blk_crypto_sysfs_unregister(disk);
904 
905 	mutex_lock(&q->sysfs_lock);
906 	elv_unregister_queue(q);
907 	disk_unregister_independent_access_ranges(disk);
908 	mutex_unlock(&q->sysfs_lock);
909 
910 	/* Now that we've deleted all child objects, we can delete the queue. */
911 	kobject_uevent(&disk->queue_kobj, KOBJ_REMOVE);
912 	kobject_del(&disk->queue_kobj);
913 	mutex_unlock(&q->sysfs_dir_lock);
914 
915 	blk_debugfs_remove(disk);
916 }
917