block/blk-sysfs.c
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Functions related to sysfs handling
4  */
5 #include <linux/kernel.h>
6 #include <linux/slab.h>
7 #include <linux/module.h>
8 #include <linux/bio.h>
9 #include <linux/blkdev.h>
10 #include <linux/backing-dev.h>
11 #include <linux/blktrace_api.h>
12 #include <linux/blk-mq.h>
13 #include <linux/blk-cgroup.h>
14 #include <linux/debugfs.h>
15
16 #include "blk.h"
17 #include "blk-mq.h"
18 #include "blk-mq-debugfs.h"
19 #include "blk-wbt.h"
20
21 struct queue_sysfs_entry {
22         struct attribute attr;
23         ssize_t (*show)(struct request_queue *, char *);
24         ssize_t (*store)(struct request_queue *, const char *, size_t);
25 };
26
27 static ssize_t
28 queue_var_show(unsigned long var, char *page)
29 {
30         return sprintf(page, "%lu\n", var);
31 }
32
33 static ssize_t
34 queue_var_store(unsigned long *var, const char *page, size_t count)
35 {
36         int err;
37         unsigned long v;
38
39         err = kstrtoul(page, 10, &v);
40         if (err || v > UINT_MAX)
41                 return -EINVAL;
42
43         *var = v;
44
45         return count;
46 }
47
48 static ssize_t queue_var_store64(s64 *var, const char *page)
49 {
50         int err;
51         s64 v;
52
53         err = kstrtos64(page, 10, &v);
54         if (err < 0)
55                 return err;
56
57         *var = v;
58         return 0;
59 }
60
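/*
 * Illustrative userspace sketch (a standalone program, not part of this
 * file): every queue_sysfs_entry defined below surfaces as a text file under
 * /sys/block/<dev>/queue/.  Reading the file invokes the ->show() hook and
 * writing it invokes ->store(), which returns the byte count on success or a
 * negative errno.  The device name "sda", the choice of nr_requests and the
 * value 128 are assumptions made for the example.
 */
#include <fcntl.h>
#include <stdio.h>
#include <unistd.h>

int main(void)
{
	char buf[64];
	ssize_t n;
	int fd;

	/* Read: handled by queue_requests_show() -> queue_var_show(). */
	fd = open("/sys/block/sda/queue/nr_requests", O_RDONLY);
	if (fd < 0)
		return 1;
	n = read(fd, buf, sizeof(buf) - 1);
	if (n > 0) {
		buf[n] = '\0';
		printf("nr_requests: %s", buf);
	}
	close(fd);

	/* Write (root only): handled by queue_requests_store(). */
	fd = open("/sys/block/sda/queue/nr_requests", O_WRONLY);
	if (fd < 0)
		return 1;
	if (write(fd, "128\n", 4) != 4)
		perror("write nr_requests");
	close(fd);
	return 0;
}
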
61 static ssize_t queue_requests_show(struct request_queue *q, char *page)
62 {
63         return queue_var_show(q->nr_requests, (page));
64 }
65
66 static ssize_t
67 queue_requests_store(struct request_queue *q, const char *page, size_t count)
68 {
69         unsigned long nr;
70         int ret, err;
71
72         if (!queue_is_mq(q))
73                 return -EINVAL;
74
75         ret = queue_var_store(&nr, page, count);
76         if (ret < 0)
77                 return ret;
78
79         if (nr < BLKDEV_MIN_RQ)
80                 nr = BLKDEV_MIN_RQ;
81
82         err = blk_mq_update_nr_requests(q, nr);
83         if (err)
84                 return err;
85
86         return ret;
87 }
88
89 static ssize_t queue_ra_show(struct request_queue *q, char *page)
90 {
91         unsigned long ra_kb = q->backing_dev_info->ra_pages <<
92                                         (PAGE_SHIFT - 10);
93
94         return queue_var_show(ra_kb, (page));
95 }
96
97 static ssize_t
98 queue_ra_store(struct request_queue *q, const char *page, size_t count)
99 {
100         unsigned long ra_kb;
101         ssize_t ret = queue_var_store(&ra_kb, page, count);
102
103         if (ret < 0)
104                 return ret;
105
106         q->backing_dev_info->ra_pages = ra_kb >> (PAGE_SHIFT - 10);
107
108         return ret;
109 }
110
111 static ssize_t queue_max_sectors_show(struct request_queue *q, char *page)
112 {
113         int max_sectors_kb = queue_max_sectors(q) >> 1;
114
115         return queue_var_show(max_sectors_kb, (page));
116 }
117
118 static ssize_t queue_max_segments_show(struct request_queue *q, char *page)
119 {
120         return queue_var_show(queue_max_segments(q), (page));
121 }
122
123 static ssize_t queue_max_discard_segments_show(struct request_queue *q,
124                 char *page)
125 {
126         return queue_var_show(queue_max_discard_segments(q), (page));
127 }
128
129 static ssize_t queue_max_integrity_segments_show(struct request_queue *q, char *page)
130 {
131         return queue_var_show(q->limits.max_integrity_segments, (page));
132 }
133
134 static ssize_t queue_max_segment_size_show(struct request_queue *q, char *page)
135 {
136         return queue_var_show(queue_max_segment_size(q), (page));
137 }
138
139 static ssize_t queue_logical_block_size_show(struct request_queue *q, char *page)
140 {
141         return queue_var_show(queue_logical_block_size(q), page);
142 }
143
144 static ssize_t queue_physical_block_size_show(struct request_queue *q, char *page)
145 {
146         return queue_var_show(queue_physical_block_size(q), page);
147 }
148
149 static ssize_t queue_chunk_sectors_show(struct request_queue *q, char *page)
150 {
151         return queue_var_show(q->limits.chunk_sectors, page);
152 }
153
154 static ssize_t queue_io_min_show(struct request_queue *q, char *page)
155 {
156         return queue_var_show(queue_io_min(q), page);
157 }
158
159 static ssize_t queue_io_opt_show(struct request_queue *q, char *page)
160 {
161         return queue_var_show(queue_io_opt(q), page);
162 }
163
164 static ssize_t queue_discard_granularity_show(struct request_queue *q, char *page)
165 {
166         return queue_var_show(q->limits.discard_granularity, page);
167 }
168
169 static ssize_t queue_discard_max_hw_show(struct request_queue *q, char *page)
170 {
171
172         return sprintf(page, "%llu\n",
173                 (unsigned long long)q->limits.max_hw_discard_sectors << 9);
174 }
175
176 static ssize_t queue_discard_max_show(struct request_queue *q, char *page)
177 {
178         return sprintf(page, "%llu\n",
179                        (unsigned long long)q->limits.max_discard_sectors << 9);
180 }
181
182 static ssize_t queue_discard_max_store(struct request_queue *q,
183                                        const char *page, size_t count)
184 {
185         unsigned long max_discard;
186         ssize_t ret = queue_var_store(&max_discard, page, count);
187
188         if (ret < 0)
189                 return ret;
190
191         if (max_discard & (q->limits.discard_granularity - 1))
192                 return -EINVAL;
193
194         max_discard >>= 9;
195         if (max_discard > UINT_MAX)
196                 return -EINVAL;
197
198         if (max_discard > q->limits.max_hw_discard_sectors)
199                 max_discard = q->limits.max_hw_discard_sectors;
200
201         q->limits.max_discard_sectors = max_discard;
202         return ret;
203 }
204
205 static ssize_t queue_discard_zeroes_data_show(struct request_queue *q, char *page)
206 {
207         return queue_var_show(0, page);
208 }
209
210 static ssize_t queue_write_same_max_show(struct request_queue *q, char *page)
211 {
212         return sprintf(page, "%llu\n",
213                 (unsigned long long)q->limits.max_write_same_sectors << 9);
214 }
215
216 static ssize_t queue_write_zeroes_max_show(struct request_queue *q, char *page)
217 {
218         return sprintf(page, "%llu\n",
219                 (unsigned long long)q->limits.max_write_zeroes_sectors << 9);
220 }
221
222 static ssize_t queue_zone_append_max_show(struct request_queue *q, char *page)
223 {
224         unsigned long long max_sectors = q->limits.max_zone_append_sectors;
225
226         return sprintf(page, "%llu\n", max_sectors << SECTOR_SHIFT);
227 }
228
229 static ssize_t
230 queue_max_sectors_store(struct request_queue *q, const char *page, size_t count)
231 {
232         unsigned long max_sectors_kb,
233                 max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1,
234                         page_kb = 1 << (PAGE_SHIFT - 10);
235         ssize_t ret = queue_var_store(&max_sectors_kb, page, count);
236
237         if (ret < 0)
238                 return ret;
239
240         max_hw_sectors_kb = min_not_zero(max_hw_sectors_kb, (unsigned long)
241                                          q->limits.max_dev_sectors >> 1);
242
243         if (max_sectors_kb > max_hw_sectors_kb || max_sectors_kb < page_kb)
244                 return -EINVAL;
245
246         spin_lock_irq(&q->queue_lock);
247         q->limits.max_sectors = max_sectors_kb << 1;
248         q->backing_dev_info->io_pages = max_sectors_kb >> (PAGE_SHIFT - 10);
249         spin_unlock_irq(&q->queue_lock);
250
251         return ret;
252 }
253
254 static ssize_t queue_max_hw_sectors_show(struct request_queue *q, char *page)
255 {
256         int max_hw_sectors_kb = queue_max_hw_sectors(q) >> 1;
257
258         return queue_var_show(max_hw_sectors_kb, (page));
259 }
260
261 #define QUEUE_SYSFS_BIT_FNS(name, flag, neg)                            \
262 static ssize_t                                                          \
263 queue_show_##name(struct request_queue *q, char *page)                  \
264 {                                                                       \
265         int bit;                                                        \
266         bit = test_bit(QUEUE_FLAG_##flag, &q->queue_flags);             \
267         return queue_var_show(neg ? !bit : bit, page);                  \
268 }                                                                       \
269 static ssize_t                                                          \
270 queue_store_##name(struct request_queue *q, const char *page, size_t count) \
271 {                                                                       \
272         unsigned long val;                                              \
273         ssize_t ret;                                                    \
274         ret = queue_var_store(&val, page, count);                       \
275         if (ret < 0)                                                    \
276                  return ret;                                            \
277         if (neg)                                                        \
278                 val = !val;                                             \
279                                                                         \
280         if (val)                                                        \
281                 blk_queue_flag_set(QUEUE_FLAG_##flag, q);               \
282         else                                                            \
283                 blk_queue_flag_clear(QUEUE_FLAG_##flag, q);             \
284         return ret;                                                     \
285 }
286
287 QUEUE_SYSFS_BIT_FNS(nonrot, NONROT, 1);
288 QUEUE_SYSFS_BIT_FNS(random, ADD_RANDOM, 0);
289 QUEUE_SYSFS_BIT_FNS(iostats, IO_STAT, 0);
290 #undef QUEUE_SYSFS_BIT_FNS
291
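/*
 * Reader's note: a sketch of what the preprocessor produces for
 * QUEUE_SYSFS_BIT_FNS(nonrot, NONROT, 1) above, with the constant neg folded
 * away.  Because neg is 1, the resulting "rotational" attribute reports and
 * stores the inverse of QUEUE_FLAG_NONROT:
 *
 *	static ssize_t
 *	queue_show_nonrot(struct request_queue *q, char *page)
 *	{
 *		int bit = test_bit(QUEUE_FLAG_NONROT, &q->queue_flags);
 *
 *		return queue_var_show(!bit, page);
 *	}
 *
 *	static ssize_t
 *	queue_store_nonrot(struct request_queue *q, const char *page, size_t count)
 *	{
 *		unsigned long val;
 *		ssize_t ret = queue_var_store(&val, page, count);
 *
 *		if (ret < 0)
 *			return ret;
 *		if (!val)		(user wrote 0: not rotational)
 *			blk_queue_flag_set(QUEUE_FLAG_NONROT, q);
 *		else
 *			blk_queue_flag_clear(QUEUE_FLAG_NONROT, q);
 *		return ret;
 *	}
 */
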
292 static ssize_t queue_zoned_show(struct request_queue *q, char *page)
293 {
294         switch (blk_queue_zoned_model(q)) {
295         case BLK_ZONED_HA:
296                 return sprintf(page, "host-aware\n");
297         case BLK_ZONED_HM:
298                 return sprintf(page, "host-managed\n");
299         default:
300                 return sprintf(page, "none\n");
301         }
302 }
303
304 static ssize_t queue_nr_zones_show(struct request_queue *q, char *page)
305 {
306         return queue_var_show(blk_queue_nr_zones(q), page);
307 }
308
309 static ssize_t queue_max_open_zones_show(struct request_queue *q, char *page)
310 {
311         return queue_var_show(queue_max_open_zones(q), page);
312 }
313
314 static ssize_t queue_max_active_zones_show(struct request_queue *q, char *page)
315 {
316         return queue_var_show(queue_max_active_zones(q), page);
317 }
318
319 static ssize_t queue_nomerges_show(struct request_queue *q, char *page)
320 {
321         return queue_var_show((blk_queue_nomerges(q) << 1) |
322                                blk_queue_noxmerges(q), page);
323 }
324
325 static ssize_t queue_nomerges_store(struct request_queue *q, const char *page,
326                                     size_t count)
327 {
328         unsigned long nm;
329         ssize_t ret = queue_var_store(&nm, page, count);
330
331         if (ret < 0)
332                 return ret;
333
334         blk_queue_flag_clear(QUEUE_FLAG_NOMERGES, q);
335         blk_queue_flag_clear(QUEUE_FLAG_NOXMERGES, q);
336         if (nm == 2)
337                 blk_queue_flag_set(QUEUE_FLAG_NOMERGES, q);
338         else if (nm)
339                 blk_queue_flag_set(QUEUE_FLAG_NOXMERGES, q);
340
341         return ret;
342 }
343
344 static ssize_t queue_rq_affinity_show(struct request_queue *q, char *page)
345 {
346         bool set = test_bit(QUEUE_FLAG_SAME_COMP, &q->queue_flags);
347         bool force = test_bit(QUEUE_FLAG_SAME_FORCE, &q->queue_flags);
348
349         return queue_var_show(set << force, page);
350 }
351
352 static ssize_t
353 queue_rq_affinity_store(struct request_queue *q, const char *page, size_t count)
354 {
355         ssize_t ret = -EINVAL;
356 #ifdef CONFIG_SMP
357         unsigned long val;
358
359         ret = queue_var_store(&val, page, count);
360         if (ret < 0)
361                 return ret;
362
363         if (val == 2) {
364                 blk_queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
365                 blk_queue_flag_set(QUEUE_FLAG_SAME_FORCE, q);
366         } else if (val == 1) {
367                 blk_queue_flag_set(QUEUE_FLAG_SAME_COMP, q);
368                 blk_queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
369         } else if (val == 0) {
370                 blk_queue_flag_clear(QUEUE_FLAG_SAME_COMP, q);
371                 blk_queue_flag_clear(QUEUE_FLAG_SAME_FORCE, q);
372         }
373 #endif
374         return ret;
375 }
376
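/*
 * Reader's note on the rq_affinity encoding used by the show/store pair
 * above (the wording follows Documentation/block/queue-sysfs.rst; treat it
 * as an annotation rather than part of this file):
 *
 *	value	SAME_COMP	SAME_FORCE	meaning
 *	0	clear		clear		complete requests on any CPU
 *	1	set		clear		complete on a CPU sharing a cache
 *						with the submitter
 *	2	set		set		force completion on the submitting CPU
 *
 * queue_rq_affinity_show() reconstructs the value as "set << force", which
 * yields exactly 0, 1 or 2 for the three states stored here.
 */
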
377 static ssize_t queue_poll_delay_show(struct request_queue *q, char *page)
378 {
379         int val;
380
381         if (q->poll_nsec == BLK_MQ_POLL_CLASSIC)
382                 val = BLK_MQ_POLL_CLASSIC;
383         else
384                 val = q->poll_nsec / 1000;
385
386         return sprintf(page, "%d\n", val);
387 }
388
389 static ssize_t queue_poll_delay_store(struct request_queue *q, const char *page,
390                                 size_t count)
391 {
392         int err, val;
393
394         if (!q->mq_ops || !q->mq_ops->poll)
395                 return -EINVAL;
396
397         err = kstrtoint(page, 10, &val);
398         if (err < 0)
399                 return err;
400
401         if (val == BLK_MQ_POLL_CLASSIC)
402                 q->poll_nsec = BLK_MQ_POLL_CLASSIC;
403         else if (val >= 0)
404                 q->poll_nsec = val * 1000;
405         else
406                 return -EINVAL;
407
408         return count;
409 }
410
411 static ssize_t queue_poll_show(struct request_queue *q, char *page)
412 {
413         return queue_var_show(test_bit(QUEUE_FLAG_POLL, &q->queue_flags), page);
414 }
415
416 static ssize_t queue_poll_store(struct request_queue *q, const char *page,
417                                 size_t count)
418 {
419         unsigned long poll_on;
420         ssize_t ret;
421
422         if (!q->tag_set || q->tag_set->nr_maps <= HCTX_TYPE_POLL ||
423             !q->tag_set->map[HCTX_TYPE_POLL].nr_queues)
424                 return -EINVAL;
425
426         ret = queue_var_store(&poll_on, page, count);
427         if (ret < 0)
428                 return ret;
429
430         if (poll_on)
431                 blk_queue_flag_set(QUEUE_FLAG_POLL, q);
432         else
433                 blk_queue_flag_clear(QUEUE_FLAG_POLL, q);
434
435         return ret;
436 }
437
438 static ssize_t queue_io_timeout_show(struct request_queue *q, char *page)
439 {
440         return sprintf(page, "%u\n", jiffies_to_msecs(q->rq_timeout));
441 }
442
443 static ssize_t queue_io_timeout_store(struct request_queue *q, const char *page,
444                                   size_t count)
445 {
446         unsigned int val;
447         int err;
448
449         err = kstrtou32(page, 10, &val);
450         if (err || val == 0)
451                 return -EINVAL;
452
453         blk_queue_rq_timeout(q, msecs_to_jiffies(val));
454
455         return count;
456 }
457
458 static ssize_t queue_wb_lat_show(struct request_queue *q, char *page)
459 {
460         if (!wbt_rq_qos(q))
461                 return -EINVAL;
462
463         return sprintf(page, "%llu\n", div_u64(wbt_get_min_lat(q), 1000));
464 }
465
466 static ssize_t queue_wb_lat_store(struct request_queue *q, const char *page,
467                                   size_t count)
468 {
469         struct rq_qos *rqos;
470         ssize_t ret;
471         s64 val;
472
473         ret = queue_var_store64(&val, page);
474         if (ret < 0)
475                 return ret;
476         if (val < -1)
477                 return -EINVAL;
478
479         rqos = wbt_rq_qos(q);
480         if (!rqos) {
481                 ret = wbt_init(q);
482                 if (ret)
483                         return ret;
484         }
485
486         if (val == -1)
487                 val = wbt_default_latency_nsec(q);
488         else if (val >= 0)
489                 val *= 1000ULL;
490
491         if (wbt_get_min_lat(q) == val)
492                 return count;
493
494         /*
495          * Ensure that the queue is idled, in case the latency update
496          * ends up either enabling or disabling wbt completely. We can't
497          * have IO inflight if that happens.
498          */
499         blk_mq_freeze_queue(q);
500         blk_mq_quiesce_queue(q);
501
502         wbt_set_min_lat(q, val);
503
504         blk_mq_unquiesce_queue(q);
505         blk_mq_unfreeze_queue(q);
506
507         return count;
508 }
509
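/*
 * Reader's note (not part of this file): wbt_lat_usec takes a latency target
 * in microseconds.  A worked example of the conversion performed above,
 * assuming wbt is already initialized on the queue:
 *
 *	writing "75"  -> queue_var_store64() parses 75
 *	              -> val *= 1000, so wbt_set_min_lat(q, 75000) nanoseconds
 *	writing "-1"  -> val = wbt_default_latency_nsec(q), restoring the
 *	                 device-type default
 *
 * The queue is frozen and quiesced around wbt_set_min_lat() because changing
 * the target may enable or disable wbt entirely (see the comment above).
 */
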
510 static ssize_t queue_wc_show(struct request_queue *q, char *page)
511 {
512         if (test_bit(QUEUE_FLAG_WC, &q->queue_flags))
513                 return sprintf(page, "write back\n");
514
515         return sprintf(page, "write through\n");
516 }
517
518 static ssize_t queue_wc_store(struct request_queue *q, const char *page,
519                               size_t count)
520 {
521         int set = -1;
522
523         if (!strncmp(page, "write back", 10))
524                 set = 1;
525         else if (!strncmp(page, "write through", 13) ||
526                  !strncmp(page, "none", 4))
527                 set = 0;
528
529         if (set == -1)
530                 return -EINVAL;
531
532         if (set)
533                 blk_queue_flag_set(QUEUE_FLAG_WC, q);
534         else
535                 blk_queue_flag_clear(QUEUE_FLAG_WC, q);
536
537         return count;
538 }
539
540 static ssize_t queue_fua_show(struct request_queue *q, char *page)
541 {
542         return sprintf(page, "%u\n", test_bit(QUEUE_FLAG_FUA, &q->queue_flags));
543 }
544
545 static ssize_t queue_dax_show(struct request_queue *q, char *page)
546 {
547         return queue_var_show(blk_queue_dax(q), page);
548 }
549
550 static struct queue_sysfs_entry queue_requests_entry = {
551         .attr = {.name = "nr_requests", .mode = 0644 },
552         .show = queue_requests_show,
553         .store = queue_requests_store,
554 };
555
556 static struct queue_sysfs_entry queue_ra_entry = {
557         .attr = {.name = "read_ahead_kb", .mode = 0644 },
558         .show = queue_ra_show,
559         .store = queue_ra_store,
560 };
561
562 static struct queue_sysfs_entry queue_max_sectors_entry = {
563         .attr = {.name = "max_sectors_kb", .mode = 0644 },
564         .show = queue_max_sectors_show,
565         .store = queue_max_sectors_store,
566 };
567
568 static struct queue_sysfs_entry queue_max_hw_sectors_entry = {
569         .attr = {.name = "max_hw_sectors_kb", .mode = 0444 },
570         .show = queue_max_hw_sectors_show,
571 };
572
573 static struct queue_sysfs_entry queue_max_segments_entry = {
574         .attr = {.name = "max_segments", .mode = 0444 },
575         .show = queue_max_segments_show,
576 };
577
578 static struct queue_sysfs_entry queue_max_discard_segments_entry = {
579         .attr = {.name = "max_discard_segments", .mode = 0444 },
580         .show = queue_max_discard_segments_show,
581 };
582
583 static struct queue_sysfs_entry queue_max_integrity_segments_entry = {
584         .attr = {.name = "max_integrity_segments", .mode = 0444 },
585         .show = queue_max_integrity_segments_show,
586 };
587
588 static struct queue_sysfs_entry queue_max_segment_size_entry = {
589         .attr = {.name = "max_segment_size", .mode = 0444 },
590         .show = queue_max_segment_size_show,
591 };
592
593 static struct queue_sysfs_entry queue_iosched_entry = {
594         .attr = {.name = "scheduler", .mode = 0644 },
595         .show = elv_iosched_show,
596         .store = elv_iosched_store,
597 };
598
599 static struct queue_sysfs_entry queue_hw_sector_size_entry = {
600         .attr = {.name = "hw_sector_size", .mode = 0444 },
601         .show = queue_logical_block_size_show,
602 };
603
604 static struct queue_sysfs_entry queue_logical_block_size_entry = {
605         .attr = {.name = "logical_block_size", .mode = 0444 },
606         .show = queue_logical_block_size_show,
607 };
608
609 static struct queue_sysfs_entry queue_physical_block_size_entry = {
610         .attr = {.name = "physical_block_size", .mode = 0444 },
611         .show = queue_physical_block_size_show,
612 };
613
614 static struct queue_sysfs_entry queue_chunk_sectors_entry = {
615         .attr = {.name = "chunk_sectors", .mode = 0444 },
616         .show = queue_chunk_sectors_show,
617 };
618
619 static struct queue_sysfs_entry queue_io_min_entry = {
620         .attr = {.name = "minimum_io_size", .mode = 0444 },
621         .show = queue_io_min_show,
622 };
623
624 static struct queue_sysfs_entry queue_io_opt_entry = {
625         .attr = {.name = "optimal_io_size", .mode = 0444 },
626         .show = queue_io_opt_show,
627 };
628
629 static struct queue_sysfs_entry queue_discard_granularity_entry = {
630         .attr = {.name = "discard_granularity", .mode = 0444 },
631         .show = queue_discard_granularity_show,
632 };
633
634 static struct queue_sysfs_entry queue_discard_max_hw_entry = {
635         .attr = {.name = "discard_max_hw_bytes", .mode = 0444 },
636         .show = queue_discard_max_hw_show,
637 };
638
639 static struct queue_sysfs_entry queue_discard_max_entry = {
640         .attr = {.name = "discard_max_bytes", .mode = 0644 },
641         .show = queue_discard_max_show,
642         .store = queue_discard_max_store,
643 };
644
645 static struct queue_sysfs_entry queue_discard_zeroes_data_entry = {
646         .attr = {.name = "discard_zeroes_data", .mode = 0444 },
647         .show = queue_discard_zeroes_data_show,
648 };
649
650 static struct queue_sysfs_entry queue_write_same_max_entry = {
651         .attr = {.name = "write_same_max_bytes", .mode = 0444 },
652         .show = queue_write_same_max_show,
653 };
654
655 static struct queue_sysfs_entry queue_write_zeroes_max_entry = {
656         .attr = {.name = "write_zeroes_max_bytes", .mode = 0444 },
657         .show = queue_write_zeroes_max_show,
658 };
659
660 static struct queue_sysfs_entry queue_zone_append_max_entry = {
661         .attr = {.name = "zone_append_max_bytes", .mode = 0444 },
662         .show = queue_zone_append_max_show,
663 };
664
665 static struct queue_sysfs_entry queue_nonrot_entry = {
666         .attr = {.name = "rotational", .mode = 0644 },
667         .show = queue_show_nonrot,
668         .store = queue_store_nonrot,
669 };
670
671 static struct queue_sysfs_entry queue_zoned_entry = {
672         .attr = {.name = "zoned", .mode = 0444 },
673         .show = queue_zoned_show,
674 };
675
676 static struct queue_sysfs_entry queue_nr_zones_entry = {
677         .attr = {.name = "nr_zones", .mode = 0444 },
678         .show = queue_nr_zones_show,
679 };
680
681 static struct queue_sysfs_entry queue_max_open_zones_entry = {
682         .attr = {.name = "max_open_zones", .mode = 0444 },
683         .show = queue_max_open_zones_show,
684 };
685
686 static struct queue_sysfs_entry queue_max_active_zones_entry = {
687         .attr = {.name = "max_active_zones", .mode = 0444 },
688         .show = queue_max_active_zones_show,
689 };
690
691 static struct queue_sysfs_entry queue_nomerges_entry = {
692         .attr = {.name = "nomerges", .mode = 0644 },
693         .show = queue_nomerges_show,
694         .store = queue_nomerges_store,
695 };
696
697 static struct queue_sysfs_entry queue_rq_affinity_entry = {
698         .attr = {.name = "rq_affinity", .mode = 0644 },
699         .show = queue_rq_affinity_show,
700         .store = queue_rq_affinity_store,
701 };
702
703 static struct queue_sysfs_entry queue_iostats_entry = {
704         .attr = {.name = "iostats", .mode = 0644 },
705         .show = queue_show_iostats,
706         .store = queue_store_iostats,
707 };
708
709 static struct queue_sysfs_entry queue_random_entry = {
710         .attr = {.name = "add_random", .mode = 0644 },
711         .show = queue_show_random,
712         .store = queue_store_random,
713 };
714
715 static struct queue_sysfs_entry queue_poll_entry = {
716         .attr = {.name = "io_poll", .mode = 0644 },
717         .show = queue_poll_show,
718         .store = queue_poll_store,
719 };
720
721 static struct queue_sysfs_entry queue_poll_delay_entry = {
722         .attr = {.name = "io_poll_delay", .mode = 0644 },
723         .show = queue_poll_delay_show,
724         .store = queue_poll_delay_store,
725 };
726
727 static struct queue_sysfs_entry queue_wc_entry = {
728         .attr = {.name = "write_cache", .mode = 0644 },
729         .show = queue_wc_show,
730         .store = queue_wc_store,
731 };
732
733 static struct queue_sysfs_entry queue_fua_entry = {
734         .attr = {.name = "fua", .mode = 0444 },
735         .show = queue_fua_show,
736 };
737
738 static struct queue_sysfs_entry queue_dax_entry = {
739         .attr = {.name = "dax", .mode = 0444 },
740         .show = queue_dax_show,
741 };
742
743 static struct queue_sysfs_entry queue_io_timeout_entry = {
744         .attr = {.name = "io_timeout", .mode = 0644 },
745         .show = queue_io_timeout_show,
746         .store = queue_io_timeout_store,
747 };
748
749 static struct queue_sysfs_entry queue_wb_lat_entry = {
750         .attr = {.name = "wbt_lat_usec", .mode = 0644 },
751         .show = queue_wb_lat_show,
752         .store = queue_wb_lat_store,
753 };
754
755 #ifdef CONFIG_BLK_DEV_THROTTLING_LOW
756 static struct queue_sysfs_entry throtl_sample_time_entry = {
757         .attr = {.name = "throttle_sample_time", .mode = 0644 },
758         .show = blk_throtl_sample_time_show,
759         .store = blk_throtl_sample_time_store,
760 };
761 #endif
762
763 static struct attribute *queue_attrs[] = {
764         &queue_requests_entry.attr,
765         &queue_ra_entry.attr,
766         &queue_max_hw_sectors_entry.attr,
767         &queue_max_sectors_entry.attr,
768         &queue_max_segments_entry.attr,
769         &queue_max_discard_segments_entry.attr,
770         &queue_max_integrity_segments_entry.attr,
771         &queue_max_segment_size_entry.attr,
772         &queue_iosched_entry.attr,
773         &queue_hw_sector_size_entry.attr,
774         &queue_logical_block_size_entry.attr,
775         &queue_physical_block_size_entry.attr,
776         &queue_chunk_sectors_entry.attr,
777         &queue_io_min_entry.attr,
778         &queue_io_opt_entry.attr,
779         &queue_discard_granularity_entry.attr,
780         &queue_discard_max_entry.attr,
781         &queue_discard_max_hw_entry.attr,
782         &queue_discard_zeroes_data_entry.attr,
783         &queue_write_same_max_entry.attr,
784         &queue_write_zeroes_max_entry.attr,
785         &queue_zone_append_max_entry.attr,
786         &queue_nonrot_entry.attr,
787         &queue_zoned_entry.attr,
788         &queue_nr_zones_entry.attr,
789         &queue_max_open_zones_entry.attr,
790         &queue_max_active_zones_entry.attr,
791         &queue_nomerges_entry.attr,
792         &queue_rq_affinity_entry.attr,
793         &queue_iostats_entry.attr,
794         &queue_random_entry.attr,
795         &queue_poll_entry.attr,
796         &queue_wc_entry.attr,
797         &queue_fua_entry.attr,
798         &queue_dax_entry.attr,
799         &queue_wb_lat_entry.attr,
800         &queue_poll_delay_entry.attr,
801         &queue_io_timeout_entry.attr,
802 #ifdef CONFIG_BLK_DEV_THROTTLING_LOW
803         &throtl_sample_time_entry.attr,
804 #endif
805         NULL,
806 };
807
808 static umode_t queue_attr_visible(struct kobject *kobj, struct attribute *attr,
809                                 int n)
810 {
811         struct request_queue *q =
812                 container_of(kobj, struct request_queue, kobj);
813
814         if (attr == &queue_io_timeout_entry.attr &&
815                 (!q->mq_ops || !q->mq_ops->timeout))
816                         return 0;
817
818         if ((attr == &queue_max_open_zones_entry.attr ||
819              attr == &queue_max_active_zones_entry.attr) &&
820             !blk_queue_is_zoned(q))
821                 return 0;
822
823         return attr->mode;
824 }
825
826 static struct attribute_group queue_attr_group = {
827         .attrs = queue_attrs,
828         .is_visible = queue_attr_visible,
829 };
830
831
832 #define to_queue(atr) container_of((atr), struct queue_sysfs_entry, attr)
833
834 static ssize_t
835 queue_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
836 {
837         struct queue_sysfs_entry *entry = to_queue(attr);
838         struct request_queue *q =
839                 container_of(kobj, struct request_queue, kobj);
840         ssize_t res;
841
842         if (!entry->show)
843                 return -EIO;
844         mutex_lock(&q->sysfs_lock);
845         res = entry->show(q, page);
846         mutex_unlock(&q->sysfs_lock);
847         return res;
848 }
849
850 static ssize_t
851 queue_attr_store(struct kobject *kobj, struct attribute *attr,
852                     const char *page, size_t length)
853 {
854         struct queue_sysfs_entry *entry = to_queue(attr);
855         struct request_queue *q;
856         ssize_t res;
857
858         if (!entry->store)
859                 return -EIO;
860
861         q = container_of(kobj, struct request_queue, kobj);
862         mutex_lock(&q->sysfs_lock);
863         res = entry->store(q, page, length);
864         mutex_unlock(&q->sysfs_lock);
865         return res;
866 }
867
868 static void blk_free_queue_rcu(struct rcu_head *rcu_head)
869 {
870         struct request_queue *q = container_of(rcu_head, struct request_queue,
871                                                rcu_head);
872         kmem_cache_free(blk_requestq_cachep, q);
873 }
874
875 /* Unconfigure the I/O scheduler and dissociate from the cgroup controller. */
876 static void blk_exit_queue(struct request_queue *q)
877 {
878         /*
879          * Since the I/O scheduler exit code may access cgroup information,
880          * perform I/O scheduler exit before disassociating from the block
881          * cgroup controller.
882          */
883         if (q->elevator) {
884                 ioc_clear_queue(q);
885                 __elevator_exit(q, q->elevator);
886                 q->elevator = NULL;
887         }
888
889         /*
890          * Remove all references to @q from the block cgroup controller before
891          * restoring @q->queue_lock, so that restoring this pointer does not cause
892          * e.g. blkcg_print_blkgs() to crash.
893          */
894         blkcg_exit_queue(q);
895
896         /*
897          * Since the cgroup code may dereference the @q->backing_dev_info
898          * pointer, only decrease its reference count after having removed the
899          * association with the block cgroup controller.
900          */
901         bdi_put(q->backing_dev_info);
902 }
903
904 /**
905  * blk_release_queue - releases all allocated resources of the request_queue
906  * @kobj: pointer to a kobject, whose container is a request_queue
907  *
908  * This function releases all allocated resources of the request queue.
909  *
910  * The struct request_queue refcount is incremented with blk_get_queue() and
911  * decremented with blk_put_queue(). Once the refcount reaches 0 this function
912  * is called.
913  *
914  * For drivers that have a request_queue on a gendisk and added with
915  * __device_add_disk() the refcount to request_queue will reach 0 with
916  * the last put_disk() called by the driver. For drivers which don't use
917  * __device_add_disk() this happens with blk_cleanup_queue().
918  *
919  * Drivers exist which depend on the release of the request_queue being
920  * synchronous, so it should not be deferred.
921  *
922  * Context: can sleep
923  */
924 static void blk_release_queue(struct kobject *kobj)
925 {
926         struct request_queue *q =
927                 container_of(kobj, struct request_queue, kobj);
928
929         might_sleep();
930
931         if (test_bit(QUEUE_FLAG_POLL_STATS, &q->queue_flags))
932                 blk_stat_remove_callback(q, q->poll_cb);
933         blk_stat_free_callback(q->poll_cb);
934
935         blk_free_queue_stats(q->stats);
936
937         if (queue_is_mq(q))
938                 cancel_delayed_work_sync(&q->requeue_work);
939
940         blk_exit_queue(q);
941
942         blk_queue_free_zone_bitmaps(q);
943
944         if (queue_is_mq(q))
945                 blk_mq_release(q);
946
947         blk_trace_shutdown(q);
948         mutex_lock(&q->debugfs_mutex);
949         debugfs_remove_recursive(q->debugfs_dir);
950         mutex_unlock(&q->debugfs_mutex);
951
952         if (queue_is_mq(q))
953                 blk_mq_debugfs_unregister(q);
954
955         bioset_exit(&q->bio_split);
956
957         ida_simple_remove(&blk_queue_ida, q->id);
958         call_rcu(&q->rcu_head, blk_free_queue_rcu);
959 }
960
961 static const struct sysfs_ops queue_sysfs_ops = {
962         .show   = queue_attr_show,
963         .store  = queue_attr_store,
964 };
965
966 struct kobj_type blk_queue_ktype = {
967         .sysfs_ops      = &queue_sysfs_ops,
968         .release        = blk_release_queue,
969 };
970
971 /**
972  * blk_register_queue - register a block layer queue with sysfs
973  * @disk: Disk of which the request queue should be registered with sysfs.
974  */
975 int blk_register_queue(struct gendisk *disk)
976 {
977         int ret;
978         struct device *dev = disk_to_dev(disk);
979         struct request_queue *q = disk->queue;
980         bool has_elevator = false;
981
982         if (WARN_ON(!q))
983                 return -ENXIO;
984
985         WARN_ONCE(blk_queue_registered(q),
986                   "%s is registering an already registered queue\n",
987                   kobject_name(&dev->kobj));
988
989         /*
990          * SCSI probing may synchronously create and destroy a lot of
991          * request_queues for non-existent devices.  Shutting down a fully
992          * functional queue takes measurable wallclock time as RCU grace
993          * periods are involved.  To avoid excessive latency in these
994          * cases, a request_queue starts out in a degraded mode which is
995          * faster to shut down and is made fully functional here as
996          * request_queues for non-existent devices never get registered.
997          */
998         if (!blk_queue_init_done(q)) {
999                 blk_queue_flag_set(QUEUE_FLAG_INIT_DONE, q);
1000                 percpu_ref_switch_to_percpu(&q->q_usage_counter);
1001         }
1002
1003         ret = blk_trace_init_sysfs(dev);
1004         if (ret)
1005                 return ret;
1006
1007         mutex_lock(&q->sysfs_dir_lock);
1008
1009         ret = kobject_add(&q->kobj, kobject_get(&dev->kobj), "%s", "queue");
1010         if (ret < 0) {
1011                 blk_trace_remove_sysfs(dev);
1012                 goto unlock;
1013         }
1014
1015         ret = sysfs_create_group(&q->kobj, &queue_attr_group);
1016         if (ret) {
1017                 blk_trace_remove_sysfs(dev);
1018                 kobject_del(&q->kobj);
1019                 kobject_put(&dev->kobj);
1020                 goto unlock;
1021         }
1022
1023         mutex_lock(&q->debugfs_mutex);
1024         q->debugfs_dir = debugfs_create_dir(kobject_name(q->kobj.parent),
1025                                             blk_debugfs_root);
1026         mutex_unlock(&q->debugfs_mutex);
1027
1028         if (queue_is_mq(q)) {
1029                 __blk_mq_register_dev(dev, q);
1030                 blk_mq_debugfs_register(q);
1031         }
1032
1033         mutex_lock(&q->sysfs_lock);
1034         if (q->elevator) {
1035                 ret = elv_register_queue(q, false);
1036                 if (ret) {
1037                         mutex_unlock(&q->sysfs_lock);
1038                         mutex_unlock(&q->sysfs_dir_lock);
1039                         kobject_del(&q->kobj);
1040                         blk_trace_remove_sysfs(dev);
1041                         kobject_put(&dev->kobj);
1042                         return ret;
1043                 }
1044                 has_elevator = true;
1045         }
1046
1047         blk_queue_flag_set(QUEUE_FLAG_REGISTERED, q);
1048         wbt_enable_default(q);
1049         blk_throtl_register_queue(q);
1050
1051         /* Now everything is ready and send out KOBJ_ADD uevent */
1052         kobject_uevent(&q->kobj, KOBJ_ADD);
1053         if (has_elevator)
1054                 kobject_uevent(&q->elevator->kobj, KOBJ_ADD);
1055         mutex_unlock(&q->sysfs_lock);
1056
1057         ret = 0;
1058 unlock:
1059         mutex_unlock(&q->sysfs_dir_lock);
1060         return ret;
1061 }
1062 EXPORT_SYMBOL_GPL(blk_register_queue);
1063
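/*
 * Illustrative driver-side sketch (a standalone fragment, not part of this
 * file): how a request_queue ends up with a /sys/block/<disk>/queue directory.
 * device_add_disk() is what eventually calls blk_register_queue(), and a
 * later del_gendisk() calls blk_unregister_queue().  All my_/MY_ names are
 * assumptions and error handling is trimmed to the essentials.
 */
#include <linux/module.h>
#include <linux/blkdev.h>
#include <linux/blk-mq.h>
#include <linux/genhd.h>

static struct blk_mq_tag_set my_tag_set;	/* assumed: set up via blk_mq_alloc_tag_set() */
static const struct block_device_operations my_block_ops = {
	.owner = THIS_MODULE,
};
static int my_major;				/* assumed: obtained from register_blkdev() */
#define MY_NR_SECTORS	(1024 * 1024)		/* assumed capacity: 512 MiB in 512-byte sectors */

static int my_probe(struct device *parent)
{
	struct request_queue *q;
	struct gendisk *disk;

	q = blk_mq_init_queue(&my_tag_set);
	if (IS_ERR(q))
		return PTR_ERR(q);

	disk = alloc_disk(1);
	if (!disk) {
		blk_cleanup_queue(q);
		return -ENOMEM;
	}

	disk->major = my_major;
	disk->first_minor = 0;
	disk->fops = &my_block_ops;
	disk->queue = q;
	snprintf(disk->disk_name, sizeof(disk->disk_name), "myblk0");
	set_capacity(disk, MY_NR_SECTORS);

	/* Registers the queue with sysfs via blk_register_queue(). */
	device_add_disk(parent, disk, NULL);
	return 0;
}
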
1064 /**
1065  * blk_unregister_queue - counterpart of blk_register_queue()
1066  * @disk: Disk of which the request queue should be unregistered from sysfs.
1067  *
1068  * Note: the caller is responsible for guaranteeing that this function is called
1069  * after blk_register_queue() has finished.
1070  */
1071 void blk_unregister_queue(struct gendisk *disk)
1072 {
1073         struct request_queue *q = disk->queue;
1074
1075         if (WARN_ON(!q))
1076                 return;
1077
1078         /* Return early if disk->queue was never registered. */
1079         if (!blk_queue_registered(q))
1080                 return;
1081
1082         /*
1083          * Since sysfs_remove_dir() prevents adding new directory entries
1084          * before removal of existing entries starts, protect against
1085          * concurrent elv_iosched_store() calls.
1086          */
1087         mutex_lock(&q->sysfs_lock);
1088         blk_queue_flag_clear(QUEUE_FLAG_REGISTERED, q);
1089         mutex_unlock(&q->sysfs_lock);
1090
1091         mutex_lock(&q->sysfs_dir_lock);
1092         /*
1093          * Remove the sysfs attributes before unregistering the queue data
1094          * structures that can be modified through sysfs.
1095          */
1096         if (queue_is_mq(q))
1097                 blk_mq_unregister_dev(disk_to_dev(disk), q);
1098
1099         kobject_uevent(&q->kobj, KOBJ_REMOVE);
1100         kobject_del(&q->kobj);
1101         blk_trace_remove_sysfs(disk_to_dev(disk));
1102
1103         mutex_lock(&q->sysfs_lock);
1104         if (q->elevator)
1105                 elv_unregister_queue(q);
1106         mutex_unlock(&q->sysfs_lock);
1107         mutex_unlock(&q->sysfs_dir_lock);
1108
1109         kobject_put(&disk_to_dev(disk)->kobj);
1110 }