1 // SPDX-License-Identifier: GPL-2.0
2 #include <linux/kernel.h>
3 #include <linux/module.h>
4 #include <linux/backing-dev.h>
5 #include <linux/bio.h>
6 #include <linux/blkdev.h>
7 #include <linux/mm.h>
8 #include <linux/init.h>
9 #include <linux/slab.h>
10 #include <linux/workqueue.h>
11 #include <linux/smp.h>
12
13 #include "blk.h"
14 #include "blk-mq.h"
15
blk_mq_sysfs_release(struct kobject * kobj)16 static void blk_mq_sysfs_release(struct kobject *kobj)
17 {
18 struct blk_mq_ctxs *ctxs = container_of(kobj, struct blk_mq_ctxs, kobj);
19
20 free_percpu(ctxs->queue_ctx);
21 kfree(ctxs);
22 }
23
blk_mq_ctx_sysfs_release(struct kobject * kobj)24 static void blk_mq_ctx_sysfs_release(struct kobject *kobj)
25 {
26 struct blk_mq_ctx *ctx = container_of(kobj, struct blk_mq_ctx, kobj);
27
28 /* ctx->ctxs won't be released until all ctx are freed */
29 kobject_put(&ctx->ctxs->kobj);
30 }
31
blk_mq_hw_sysfs_release(struct kobject * kobj)32 static void blk_mq_hw_sysfs_release(struct kobject *kobj)
33 {
34 struct blk_mq_hw_ctx *hctx = container_of(kobj, struct blk_mq_hw_ctx,
35 kobj);
36
37 blk_free_flush_queue(hctx->fq);
38 sbitmap_free(&hctx->ctx_map);
39 free_cpumask_var(hctx->cpumask);
40 kfree(hctx->ctxs);
41 kfree(hctx);
42 }
43
44 struct blk_mq_hw_ctx_sysfs_entry {
45 struct attribute attr;
46 ssize_t (*show)(struct blk_mq_hw_ctx *, char *);
47 };
48
blk_mq_hw_sysfs_show(struct kobject * kobj,struct attribute * attr,char * page)49 static ssize_t blk_mq_hw_sysfs_show(struct kobject *kobj,
50 struct attribute *attr, char *page)
51 {
52 struct blk_mq_hw_ctx_sysfs_entry *entry;
53 struct blk_mq_hw_ctx *hctx;
54 struct request_queue *q;
55 ssize_t res;
56
57 entry = container_of(attr, struct blk_mq_hw_ctx_sysfs_entry, attr);
58 hctx = container_of(kobj, struct blk_mq_hw_ctx, kobj);
59 q = hctx->queue;
60
61 if (!entry->show)
62 return -EIO;
63
64 mutex_lock(&q->sysfs_lock);
65 res = entry->show(hctx, page);
66 mutex_unlock(&q->sysfs_lock);
67 return res;
68 }
69
blk_mq_hw_sysfs_nr_tags_show(struct blk_mq_hw_ctx * hctx,char * page)70 static ssize_t blk_mq_hw_sysfs_nr_tags_show(struct blk_mq_hw_ctx *hctx,
71 char *page)
72 {
73 return sprintf(page, "%u\n", hctx->tags->nr_tags);
74 }
75
blk_mq_hw_sysfs_nr_reserved_tags_show(struct blk_mq_hw_ctx * hctx,char * page)76 static ssize_t blk_mq_hw_sysfs_nr_reserved_tags_show(struct blk_mq_hw_ctx *hctx,
77 char *page)
78 {
79 return sprintf(page, "%u\n", hctx->tags->nr_reserved_tags);
80 }
81
blk_mq_hw_sysfs_cpus_show(struct blk_mq_hw_ctx * hctx,char * page)82 static ssize_t blk_mq_hw_sysfs_cpus_show(struct blk_mq_hw_ctx *hctx, char *page)
83 {
84 const size_t size = PAGE_SIZE - 1;
85 unsigned int i, first = 1;
86 int ret = 0, pos = 0;
87
88 for_each_cpu(i, hctx->cpumask) {
89 if (first)
90 ret = snprintf(pos + page, size - pos, "%u", i);
91 else
92 ret = snprintf(pos + page, size - pos, ", %u", i);
93
94 if (ret >= size - pos)
95 break;
96
97 first = 0;
98 pos += ret;
99 }
100
101 ret = snprintf(pos + page, size + 1 - pos, "\n");
102 return pos + ret;
103 }
104
105 static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_nr_tags = {
106 .attr = {.name = "nr_tags", .mode = 0444 },
107 .show = blk_mq_hw_sysfs_nr_tags_show,
108 };
109 static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_nr_reserved_tags = {
110 .attr = {.name = "nr_reserved_tags", .mode = 0444 },
111 .show = blk_mq_hw_sysfs_nr_reserved_tags_show,
112 };
113 static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_cpus = {
114 .attr = {.name = "cpu_list", .mode = 0444 },
115 .show = blk_mq_hw_sysfs_cpus_show,
116 };
117
118 static struct attribute *default_hw_ctx_attrs[] = {
119 &blk_mq_hw_sysfs_nr_tags.attr,
120 &blk_mq_hw_sysfs_nr_reserved_tags.attr,
121 &blk_mq_hw_sysfs_cpus.attr,
122 NULL,
123 };
124 ATTRIBUTE_GROUPS(default_hw_ctx);
125
126 static const struct sysfs_ops blk_mq_hw_sysfs_ops = {
127 .show = blk_mq_hw_sysfs_show,
128 };
129
130 static const struct kobj_type blk_mq_ktype = {
131 .release = blk_mq_sysfs_release,
132 };
133
134 static const struct kobj_type blk_mq_ctx_ktype = {
135 .release = blk_mq_ctx_sysfs_release,
136 };
137
138 static const struct kobj_type blk_mq_hw_ktype = {
139 .sysfs_ops = &blk_mq_hw_sysfs_ops,
140 .default_groups = default_hw_ctx_groups,
141 .release = blk_mq_hw_sysfs_release,
142 };
143
blk_mq_unregister_hctx(struct blk_mq_hw_ctx * hctx)144 static void blk_mq_unregister_hctx(struct blk_mq_hw_ctx *hctx)
145 {
146 struct blk_mq_ctx *ctx;
147 int i;
148
149 if (!hctx->nr_ctx)
150 return;
151
152 hctx_for_each_ctx(hctx, ctx, i)
153 kobject_del(&ctx->kobj);
154
155 kobject_del(&hctx->kobj);
156 }
157
blk_mq_register_hctx(struct blk_mq_hw_ctx * hctx)158 static int blk_mq_register_hctx(struct blk_mq_hw_ctx *hctx)
159 {
160 struct request_queue *q = hctx->queue;
161 struct blk_mq_ctx *ctx;
162 int i, j, ret;
163
164 if (!hctx->nr_ctx)
165 return 0;
166
167 ret = kobject_add(&hctx->kobj, q->mq_kobj, "%u", hctx->queue_num);
168 if (ret)
169 return ret;
170
171 hctx_for_each_ctx(hctx, ctx, i) {
172 ret = kobject_add(&ctx->kobj, &hctx->kobj, "cpu%u", ctx->cpu);
173 if (ret)
174 goto out;
175 }
176
177 return 0;
178 out:
179 hctx_for_each_ctx(hctx, ctx, j) {
180 if (j < i)
181 kobject_del(&ctx->kobj);
182 }
183 kobject_del(&hctx->kobj);
184 return ret;
185 }
186
blk_mq_hctx_kobj_init(struct blk_mq_hw_ctx * hctx)187 void blk_mq_hctx_kobj_init(struct blk_mq_hw_ctx *hctx)
188 {
189 kobject_init(&hctx->kobj, &blk_mq_hw_ktype);
190 }
191
blk_mq_sysfs_deinit(struct request_queue * q)192 void blk_mq_sysfs_deinit(struct request_queue *q)
193 {
194 struct blk_mq_ctx *ctx;
195 int cpu;
196
197 for_each_possible_cpu(cpu) {
198 ctx = per_cpu_ptr(q->queue_ctx, cpu);
199 kobject_put(&ctx->kobj);
200 }
201 kobject_put(q->mq_kobj);
202 }
203
blk_mq_sysfs_init(struct request_queue * q)204 void blk_mq_sysfs_init(struct request_queue *q)
205 {
206 struct blk_mq_ctx *ctx;
207 int cpu;
208
209 kobject_init(q->mq_kobj, &blk_mq_ktype);
210
211 for_each_possible_cpu(cpu) {
212 ctx = per_cpu_ptr(q->queue_ctx, cpu);
213
214 kobject_get(q->mq_kobj);
215 kobject_init(&ctx->kobj, &blk_mq_ctx_ktype);
216 }
217 }
218
blk_mq_sysfs_register(struct gendisk * disk)219 int blk_mq_sysfs_register(struct gendisk *disk)
220 {
221 struct request_queue *q = disk->queue;
222 struct blk_mq_hw_ctx *hctx;
223 unsigned long i, j;
224 int ret;
225
226 lockdep_assert_held(&q->sysfs_dir_lock);
227
228 ret = kobject_add(q->mq_kobj, &disk_to_dev(disk)->kobj, "mq");
229 if (ret < 0)
230 goto out;
231
232 kobject_uevent(q->mq_kobj, KOBJ_ADD);
233
234 queue_for_each_hw_ctx(q, hctx, i) {
235 ret = blk_mq_register_hctx(hctx);
236 if (ret)
237 goto unreg;
238 }
239
240 q->mq_sysfs_init_done = true;
241
242 out:
243 return ret;
244
245 unreg:
246 queue_for_each_hw_ctx(q, hctx, j) {
247 if (j < i)
248 blk_mq_unregister_hctx(hctx);
249 }
250
251 kobject_uevent(q->mq_kobj, KOBJ_REMOVE);
252 kobject_del(q->mq_kobj);
253 return ret;
254 }
255
blk_mq_sysfs_unregister(struct gendisk * disk)256 void blk_mq_sysfs_unregister(struct gendisk *disk)
257 {
258 struct request_queue *q = disk->queue;
259 struct blk_mq_hw_ctx *hctx;
260 unsigned long i;
261
262 lockdep_assert_held(&q->sysfs_dir_lock);
263
264 queue_for_each_hw_ctx(q, hctx, i)
265 blk_mq_unregister_hctx(hctx);
266
267 kobject_uevent(q->mq_kobj, KOBJ_REMOVE);
268 kobject_del(q->mq_kobj);
269
270 q->mq_sysfs_init_done = false;
271 }
272
blk_mq_sysfs_unregister_hctxs(struct request_queue * q)273 void blk_mq_sysfs_unregister_hctxs(struct request_queue *q)
274 {
275 struct blk_mq_hw_ctx *hctx;
276 unsigned long i;
277
278 mutex_lock(&q->sysfs_dir_lock);
279 if (!q->mq_sysfs_init_done)
280 goto unlock;
281
282 queue_for_each_hw_ctx(q, hctx, i)
283 blk_mq_unregister_hctx(hctx);
284
285 unlock:
286 mutex_unlock(&q->sysfs_dir_lock);
287 }
288
blk_mq_sysfs_register_hctxs(struct request_queue * q)289 int blk_mq_sysfs_register_hctxs(struct request_queue *q)
290 {
291 struct blk_mq_hw_ctx *hctx;
292 unsigned long i;
293 int ret = 0;
294
295 mutex_lock(&q->sysfs_dir_lock);
296 if (!q->mq_sysfs_init_done)
297 goto unlock;
298
299 queue_for_each_hw_ctx(q, hctx, i) {
300 ret = blk_mq_register_hctx(hctx);
301 if (ret)
302 break;
303 }
304
305 unlock:
306 mutex_unlock(&q->sysfs_dir_lock);
307
308 return ret;
309 }
310