1 // SPDX-License-Identifier: GPL-2.0-only
2 /* Copyright(c) 2020 Intel Corporation. All rights reserved. */
3 #include <linux/platform_device.h>
4 #include <linux/memregion.h>
5 #include <linux/workqueue.h>
6 #include <linux/debugfs.h>
7 #include <linux/device.h>
8 #include <linux/module.h>
9 #include <linux/pci.h>
10 #include <linux/slab.h>
11 #include <linux/idr.h>
12 #include <linux/node.h>
13 #include <cxl/einj.h>
14 #include <cxlmem.h>
15 #include <cxlpci.h>
16 #include <cxl.h>
17 #include "core.h"
18
19 /**
20 * DOC: cxl core
21 *
22 * The CXL core provides a set of interfaces that can be consumed by CXL aware
23 * drivers. The interfaces allow for creation, modification, and destruction of
24 * regions, memory devices, ports, and decoders. CXL aware drivers must register
25 * with the CXL core via these interfaces in order to be able to participate in
26 * cross-device interleave coordination. The CXL core also establishes and
27 * maintains the bridge to the nvdimm subsystem.
28 *
29 * CXL core introduces sysfs hierarchy to control the devices that are
30 * instantiated by the core.
31 */
32
33 /*
34 * All changes to the interleave configuration occur with this lock held
35 * for write.
36 */
37 DECLARE_RWSEM(cxl_region_rwsem);
38
39 static DEFINE_IDA(cxl_port_ida);
40 static DEFINE_XARRAY(cxl_root_buses);
41
cxl_num_decoders_committed(struct cxl_port * port)42 int cxl_num_decoders_committed(struct cxl_port *port)
43 {
44 lockdep_assert_held(&cxl_region_rwsem);
45
46 return port->commit_end + 1;
47 }
48
devtype_show(struct device * dev,struct device_attribute * attr,char * buf)49 static ssize_t devtype_show(struct device *dev, struct device_attribute *attr,
50 char *buf)
51 {
52 return sysfs_emit(buf, "%s\n", dev->type->name);
53 }
54 static DEVICE_ATTR_RO(devtype);
55
cxl_device_id(const struct device * dev)56 static int cxl_device_id(const struct device *dev)
57 {
58 if (dev->type == &cxl_nvdimm_bridge_type)
59 return CXL_DEVICE_NVDIMM_BRIDGE;
60 if (dev->type == &cxl_nvdimm_type)
61 return CXL_DEVICE_NVDIMM;
62 if (dev->type == CXL_PMEM_REGION_TYPE())
63 return CXL_DEVICE_PMEM_REGION;
64 if (dev->type == CXL_DAX_REGION_TYPE())
65 return CXL_DEVICE_DAX_REGION;
66 if (is_cxl_port(dev)) {
67 if (is_cxl_root(to_cxl_port(dev)))
68 return CXL_DEVICE_ROOT;
69 return CXL_DEVICE_PORT;
70 }
71 if (is_cxl_memdev(dev))
72 return CXL_DEVICE_MEMORY_EXPANDER;
73 if (dev->type == CXL_REGION_TYPE())
74 return CXL_DEVICE_REGION;
75 if (dev->type == &cxl_pmu_type)
76 return CXL_DEVICE_PMU;
77 return 0;
78 }
79
modalias_show(struct device * dev,struct device_attribute * attr,char * buf)80 static ssize_t modalias_show(struct device *dev, struct device_attribute *attr,
81 char *buf)
82 {
83 return sysfs_emit(buf, CXL_MODALIAS_FMT "\n", cxl_device_id(dev));
84 }
85 static DEVICE_ATTR_RO(modalias);
86
87 static struct attribute *cxl_base_attributes[] = {
88 &dev_attr_devtype.attr,
89 &dev_attr_modalias.attr,
90 NULL,
91 };
92
93 struct attribute_group cxl_base_attribute_group = {
94 .attrs = cxl_base_attributes,
95 };
96
start_show(struct device * dev,struct device_attribute * attr,char * buf)97 static ssize_t start_show(struct device *dev, struct device_attribute *attr,
98 char *buf)
99 {
100 struct cxl_decoder *cxld = to_cxl_decoder(dev);
101
102 return sysfs_emit(buf, "%#llx\n", cxld->hpa_range.start);
103 }
104 static DEVICE_ATTR_ADMIN_RO(start);
105
size_show(struct device * dev,struct device_attribute * attr,char * buf)106 static ssize_t size_show(struct device *dev, struct device_attribute *attr,
107 char *buf)
108 {
109 struct cxl_decoder *cxld = to_cxl_decoder(dev);
110
111 return sysfs_emit(buf, "%#llx\n", range_len(&cxld->hpa_range));
112 }
113 static DEVICE_ATTR_RO(size);
114
115 #define CXL_DECODER_FLAG_ATTR(name, flag) \
116 static ssize_t name##_show(struct device *dev, \
117 struct device_attribute *attr, char *buf) \
118 { \
119 struct cxl_decoder *cxld = to_cxl_decoder(dev); \
120 \
121 return sysfs_emit(buf, "%s\n", \
122 (cxld->flags & (flag)) ? "1" : "0"); \
123 } \
124 static DEVICE_ATTR_RO(name)
125
126 CXL_DECODER_FLAG_ATTR(cap_pmem, CXL_DECODER_F_PMEM);
127 CXL_DECODER_FLAG_ATTR(cap_ram, CXL_DECODER_F_RAM);
128 CXL_DECODER_FLAG_ATTR(cap_type2, CXL_DECODER_F_TYPE2);
129 CXL_DECODER_FLAG_ATTR(cap_type3, CXL_DECODER_F_TYPE3);
130 CXL_DECODER_FLAG_ATTR(locked, CXL_DECODER_F_LOCK);
131
target_type_show(struct device * dev,struct device_attribute * attr,char * buf)132 static ssize_t target_type_show(struct device *dev,
133 struct device_attribute *attr, char *buf)
134 {
135 struct cxl_decoder *cxld = to_cxl_decoder(dev);
136
137 switch (cxld->target_type) {
138 case CXL_DECODER_DEVMEM:
139 return sysfs_emit(buf, "accelerator\n");
140 case CXL_DECODER_HOSTONLYMEM:
141 return sysfs_emit(buf, "expander\n");
142 }
143 return -ENXIO;
144 }
145 static DEVICE_ATTR_RO(target_type);
146
emit_target_list(struct cxl_switch_decoder * cxlsd,char * buf)147 static ssize_t emit_target_list(struct cxl_switch_decoder *cxlsd, char *buf)
148 {
149 struct cxl_decoder *cxld = &cxlsd->cxld;
150 ssize_t offset = 0;
151 int i, rc = 0;
152
153 for (i = 0; i < cxld->interleave_ways; i++) {
154 struct cxl_dport *dport = cxlsd->target[i];
155 struct cxl_dport *next = NULL;
156
157 if (!dport)
158 break;
159
160 if (i + 1 < cxld->interleave_ways)
161 next = cxlsd->target[i + 1];
162 rc = sysfs_emit_at(buf, offset, "%d%s", dport->port_id,
163 next ? "," : "");
164 if (rc < 0)
165 return rc;
166 offset += rc;
167 }
168
169 return offset;
170 }
171
target_list_show(struct device * dev,struct device_attribute * attr,char * buf)172 static ssize_t target_list_show(struct device *dev,
173 struct device_attribute *attr, char *buf)
174 {
175 struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
176 ssize_t offset;
177 int rc;
178
179 guard(rwsem_read)(&cxl_region_rwsem);
180 rc = emit_target_list(cxlsd, buf);
181 if (rc < 0)
182 return rc;
183 offset = rc;
184
185 rc = sysfs_emit_at(buf, offset, "\n");
186 if (rc < 0)
187 return rc;
188
189 return offset + rc;
190 }
191 static DEVICE_ATTR_RO(target_list);
192
mode_show(struct device * dev,struct device_attribute * attr,char * buf)193 static ssize_t mode_show(struct device *dev, struct device_attribute *attr,
194 char *buf)
195 {
196 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
197 struct cxl_memdev *cxlmd = cxled_to_memdev(cxled);
198 struct cxl_dev_state *cxlds = cxlmd->cxlds;
199 /* without @cxl_dpa_rwsem, make sure @part is not reloaded */
200 int part = READ_ONCE(cxled->part);
201 const char *desc;
202
203 if (part < 0)
204 desc = "none";
205 else
206 desc = cxlds->part[part].res.name;
207
208 return sysfs_emit(buf, "%s\n", desc);
209 }
210
mode_store(struct device * dev,struct device_attribute * attr,const char * buf,size_t len)211 static ssize_t mode_store(struct device *dev, struct device_attribute *attr,
212 const char *buf, size_t len)
213 {
214 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
215 enum cxl_partition_mode mode;
216 ssize_t rc;
217
218 if (sysfs_streq(buf, "pmem"))
219 mode = CXL_PARTMODE_PMEM;
220 else if (sysfs_streq(buf, "ram"))
221 mode = CXL_PARTMODE_RAM;
222 else
223 return -EINVAL;
224
225 rc = cxl_dpa_set_part(cxled, mode);
226 if (rc)
227 return rc;
228
229 return len;
230 }
231 static DEVICE_ATTR_RW(mode);
232
dpa_resource_show(struct device * dev,struct device_attribute * attr,char * buf)233 static ssize_t dpa_resource_show(struct device *dev, struct device_attribute *attr,
234 char *buf)
235 {
236 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
237
238 guard(rwsem_read)(&cxl_dpa_rwsem);
239 return sysfs_emit(buf, "%#llx\n", (u64)cxl_dpa_resource_start(cxled));
240 }
241 static DEVICE_ATTR_RO(dpa_resource);
242
dpa_size_show(struct device * dev,struct device_attribute * attr,char * buf)243 static ssize_t dpa_size_show(struct device *dev, struct device_attribute *attr,
244 char *buf)
245 {
246 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
247 resource_size_t size = cxl_dpa_size(cxled);
248
249 return sysfs_emit(buf, "%pa\n", &size);
250 }
251
dpa_size_store(struct device * dev,struct device_attribute * attr,const char * buf,size_t len)252 static ssize_t dpa_size_store(struct device *dev, struct device_attribute *attr,
253 const char *buf, size_t len)
254 {
255 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
256 unsigned long long size;
257 ssize_t rc;
258
259 rc = kstrtoull(buf, 0, &size);
260 if (rc)
261 return rc;
262
263 if (!IS_ALIGNED(size, SZ_256M))
264 return -EINVAL;
265
266 rc = cxl_dpa_free(cxled);
267 if (rc)
268 return rc;
269
270 if (size == 0)
271 return len;
272
273 rc = cxl_dpa_alloc(cxled, size);
274 if (rc)
275 return rc;
276
277 return len;
278 }
279 static DEVICE_ATTR_RW(dpa_size);
280
interleave_granularity_show(struct device * dev,struct device_attribute * attr,char * buf)281 static ssize_t interleave_granularity_show(struct device *dev,
282 struct device_attribute *attr,
283 char *buf)
284 {
285 struct cxl_decoder *cxld = to_cxl_decoder(dev);
286
287 return sysfs_emit(buf, "%d\n", cxld->interleave_granularity);
288 }
289
290 static DEVICE_ATTR_RO(interleave_granularity);
291
interleave_ways_show(struct device * dev,struct device_attribute * attr,char * buf)292 static ssize_t interleave_ways_show(struct device *dev,
293 struct device_attribute *attr, char *buf)
294 {
295 struct cxl_decoder *cxld = to_cxl_decoder(dev);
296
297 return sysfs_emit(buf, "%d\n", cxld->interleave_ways);
298 }
299
300 static DEVICE_ATTR_RO(interleave_ways);
301
qos_class_show(struct device * dev,struct device_attribute * attr,char * buf)302 static ssize_t qos_class_show(struct device *dev,
303 struct device_attribute *attr, char *buf)
304 {
305 struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
306
307 return sysfs_emit(buf, "%d\n", cxlrd->qos_class);
308 }
309 static DEVICE_ATTR_RO(qos_class);
310
311 static struct attribute *cxl_decoder_base_attrs[] = {
312 &dev_attr_start.attr,
313 &dev_attr_size.attr,
314 &dev_attr_locked.attr,
315 &dev_attr_interleave_granularity.attr,
316 &dev_attr_interleave_ways.attr,
317 NULL,
318 };
319
320 static struct attribute_group cxl_decoder_base_attribute_group = {
321 .attrs = cxl_decoder_base_attrs,
322 };
323
324 static struct attribute *cxl_decoder_root_attrs[] = {
325 &dev_attr_cap_pmem.attr,
326 &dev_attr_cap_ram.attr,
327 &dev_attr_cap_type2.attr,
328 &dev_attr_cap_type3.attr,
329 &dev_attr_target_list.attr,
330 &dev_attr_qos_class.attr,
331 SET_CXL_REGION_ATTR(create_pmem_region)
332 SET_CXL_REGION_ATTR(create_ram_region)
333 SET_CXL_REGION_ATTR(delete_region)
334 NULL,
335 };
336
can_create_pmem(struct cxl_root_decoder * cxlrd)337 static bool can_create_pmem(struct cxl_root_decoder *cxlrd)
338 {
339 unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_PMEM;
340
341 return (cxlrd->cxlsd.cxld.flags & flags) == flags;
342 }
343
can_create_ram(struct cxl_root_decoder * cxlrd)344 static bool can_create_ram(struct cxl_root_decoder *cxlrd)
345 {
346 unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_RAM;
347
348 return (cxlrd->cxlsd.cxld.flags & flags) == flags;
349 }
350
cxl_root_decoder_visible(struct kobject * kobj,struct attribute * a,int n)351 static umode_t cxl_root_decoder_visible(struct kobject *kobj, struct attribute *a, int n)
352 {
353 struct device *dev = kobj_to_dev(kobj);
354 struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
355
356 if (a == CXL_REGION_ATTR(create_pmem_region) && !can_create_pmem(cxlrd))
357 return 0;
358
359 if (a == CXL_REGION_ATTR(create_ram_region) && !can_create_ram(cxlrd))
360 return 0;
361
362 if (a == CXL_REGION_ATTR(delete_region) &&
363 !(can_create_pmem(cxlrd) || can_create_ram(cxlrd)))
364 return 0;
365
366 return a->mode;
367 }
368
369 static struct attribute_group cxl_decoder_root_attribute_group = {
370 .attrs = cxl_decoder_root_attrs,
371 .is_visible = cxl_root_decoder_visible,
372 };
373
374 static const struct attribute_group *cxl_decoder_root_attribute_groups[] = {
375 &cxl_decoder_root_attribute_group,
376 &cxl_decoder_base_attribute_group,
377 &cxl_base_attribute_group,
378 NULL,
379 };
380
381 static struct attribute *cxl_decoder_switch_attrs[] = {
382 &dev_attr_target_type.attr,
383 &dev_attr_target_list.attr,
384 SET_CXL_REGION_ATTR(region)
385 NULL,
386 };
387
388 static struct attribute_group cxl_decoder_switch_attribute_group = {
389 .attrs = cxl_decoder_switch_attrs,
390 };
391
392 static const struct attribute_group *cxl_decoder_switch_attribute_groups[] = {
393 &cxl_decoder_switch_attribute_group,
394 &cxl_decoder_base_attribute_group,
395 &cxl_base_attribute_group,
396 NULL,
397 };
398
399 static struct attribute *cxl_decoder_endpoint_attrs[] = {
400 &dev_attr_target_type.attr,
401 &dev_attr_mode.attr,
402 &dev_attr_dpa_size.attr,
403 &dev_attr_dpa_resource.attr,
404 SET_CXL_REGION_ATTR(region)
405 NULL,
406 };
407
408 static struct attribute_group cxl_decoder_endpoint_attribute_group = {
409 .attrs = cxl_decoder_endpoint_attrs,
410 };
411
412 static const struct attribute_group *cxl_decoder_endpoint_attribute_groups[] = {
413 &cxl_decoder_base_attribute_group,
414 &cxl_decoder_endpoint_attribute_group,
415 &cxl_base_attribute_group,
416 NULL,
417 };
418
__cxl_decoder_release(struct cxl_decoder * cxld)419 static void __cxl_decoder_release(struct cxl_decoder *cxld)
420 {
421 struct cxl_port *port = to_cxl_port(cxld->dev.parent);
422
423 ida_free(&port->decoder_ida, cxld->id);
424 put_device(&port->dev);
425 }
426
cxl_endpoint_decoder_release(struct device * dev)427 static void cxl_endpoint_decoder_release(struct device *dev)
428 {
429 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
430
431 __cxl_decoder_release(&cxled->cxld);
432 kfree(cxled);
433 }
434
cxl_switch_decoder_release(struct device * dev)435 static void cxl_switch_decoder_release(struct device *dev)
436 {
437 struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
438
439 __cxl_decoder_release(&cxlsd->cxld);
440 kfree(cxlsd);
441 }
442
to_cxl_root_decoder(struct device * dev)443 struct cxl_root_decoder *to_cxl_root_decoder(struct device *dev)
444 {
445 if (dev_WARN_ONCE(dev, !is_root_decoder(dev),
446 "not a cxl_root_decoder device\n"))
447 return NULL;
448 return container_of(dev, struct cxl_root_decoder, cxlsd.cxld.dev);
449 }
450 EXPORT_SYMBOL_NS_GPL(to_cxl_root_decoder, "CXL");
451
cxl_root_decoder_release(struct device * dev)452 static void cxl_root_decoder_release(struct device *dev)
453 {
454 struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
455
456 if (atomic_read(&cxlrd->region_id) >= 0)
457 memregion_free(atomic_read(&cxlrd->region_id));
458 __cxl_decoder_release(&cxlrd->cxlsd.cxld);
459 kfree(cxlrd);
460 }
461
462 static const struct device_type cxl_decoder_endpoint_type = {
463 .name = "cxl_decoder_endpoint",
464 .release = cxl_endpoint_decoder_release,
465 .groups = cxl_decoder_endpoint_attribute_groups,
466 };
467
468 static const struct device_type cxl_decoder_switch_type = {
469 .name = "cxl_decoder_switch",
470 .release = cxl_switch_decoder_release,
471 .groups = cxl_decoder_switch_attribute_groups,
472 };
473
474 static const struct device_type cxl_decoder_root_type = {
475 .name = "cxl_decoder_root",
476 .release = cxl_root_decoder_release,
477 .groups = cxl_decoder_root_attribute_groups,
478 };
479
is_endpoint_decoder(struct device * dev)480 bool is_endpoint_decoder(struct device *dev)
481 {
482 return dev->type == &cxl_decoder_endpoint_type;
483 }
484 EXPORT_SYMBOL_NS_GPL(is_endpoint_decoder, "CXL");
485
is_root_decoder(struct device * dev)486 bool is_root_decoder(struct device *dev)
487 {
488 return dev->type == &cxl_decoder_root_type;
489 }
490 EXPORT_SYMBOL_NS_GPL(is_root_decoder, "CXL");
491
is_switch_decoder(struct device * dev)492 bool is_switch_decoder(struct device *dev)
493 {
494 return is_root_decoder(dev) || dev->type == &cxl_decoder_switch_type;
495 }
496 EXPORT_SYMBOL_NS_GPL(is_switch_decoder, "CXL");
497
to_cxl_decoder(struct device * dev)498 struct cxl_decoder *to_cxl_decoder(struct device *dev)
499 {
500 if (dev_WARN_ONCE(dev,
501 !is_switch_decoder(dev) && !is_endpoint_decoder(dev),
502 "not a cxl_decoder device\n"))
503 return NULL;
504 return container_of(dev, struct cxl_decoder, dev);
505 }
506 EXPORT_SYMBOL_NS_GPL(to_cxl_decoder, "CXL");
507
to_cxl_endpoint_decoder(struct device * dev)508 struct cxl_endpoint_decoder *to_cxl_endpoint_decoder(struct device *dev)
509 {
510 if (dev_WARN_ONCE(dev, !is_endpoint_decoder(dev),
511 "not a cxl_endpoint_decoder device\n"))
512 return NULL;
513 return container_of(dev, struct cxl_endpoint_decoder, cxld.dev);
514 }
515 EXPORT_SYMBOL_NS_GPL(to_cxl_endpoint_decoder, "CXL");
516
to_cxl_switch_decoder(struct device * dev)517 struct cxl_switch_decoder *to_cxl_switch_decoder(struct device *dev)
518 {
519 if (dev_WARN_ONCE(dev, !is_switch_decoder(dev),
520 "not a cxl_switch_decoder device\n"))
521 return NULL;
522 return container_of(dev, struct cxl_switch_decoder, cxld.dev);
523 }
524 EXPORT_SYMBOL_NS_GPL(to_cxl_switch_decoder, "CXL");
525
cxl_ep_release(struct cxl_ep * ep)526 static void cxl_ep_release(struct cxl_ep *ep)
527 {
528 put_device(ep->ep);
529 kfree(ep);
530 }
531
cxl_ep_remove(struct cxl_port * port,struct cxl_ep * ep)532 static void cxl_ep_remove(struct cxl_port *port, struct cxl_ep *ep)
533 {
534 if (!ep)
535 return;
536 xa_erase(&port->endpoints, (unsigned long) ep->ep);
537 cxl_ep_release(ep);
538 }
539
cxl_port_release(struct device * dev)540 static void cxl_port_release(struct device *dev)
541 {
542 struct cxl_port *port = to_cxl_port(dev);
543 unsigned long index;
544 struct cxl_ep *ep;
545
546 xa_for_each(&port->endpoints, index, ep)
547 cxl_ep_remove(port, ep);
548 xa_destroy(&port->endpoints);
549 xa_destroy(&port->dports);
550 xa_destroy(&port->regions);
551 ida_free(&cxl_port_ida, port->id);
552 if (is_cxl_root(port))
553 kfree(to_cxl_root(port));
554 else
555 kfree(port);
556 }
557
decoders_committed_show(struct device * dev,struct device_attribute * attr,char * buf)558 static ssize_t decoders_committed_show(struct device *dev,
559 struct device_attribute *attr, char *buf)
560 {
561 struct cxl_port *port = to_cxl_port(dev);
562
563 guard(rwsem_read)(&cxl_region_rwsem);
564 return sysfs_emit(buf, "%d\n", cxl_num_decoders_committed(port));
565 }
566
567 static DEVICE_ATTR_RO(decoders_committed);
568
569 static struct attribute *cxl_port_attrs[] = {
570 &dev_attr_decoders_committed.attr,
571 NULL,
572 };
573
574 static struct attribute_group cxl_port_attribute_group = {
575 .attrs = cxl_port_attrs,
576 };
577
578 static const struct attribute_group *cxl_port_attribute_groups[] = {
579 &cxl_base_attribute_group,
580 &cxl_port_attribute_group,
581 NULL,
582 };
583
584 static const struct device_type cxl_port_type = {
585 .name = "cxl_port",
586 .release = cxl_port_release,
587 .groups = cxl_port_attribute_groups,
588 };
589
is_cxl_port(const struct device * dev)590 bool is_cxl_port(const struct device *dev)
591 {
592 return dev->type == &cxl_port_type;
593 }
594 EXPORT_SYMBOL_NS_GPL(is_cxl_port, "CXL");
595
to_cxl_port(const struct device * dev)596 struct cxl_port *to_cxl_port(const struct device *dev)
597 {
598 if (dev_WARN_ONCE(dev, dev->type != &cxl_port_type,
599 "not a cxl_port device\n"))
600 return NULL;
601 return container_of(dev, struct cxl_port, dev);
602 }
603 EXPORT_SYMBOL_NS_GPL(to_cxl_port, "CXL");
604
parent_port_of(struct cxl_port * port)605 struct cxl_port *parent_port_of(struct cxl_port *port)
606 {
607 if (!port || !port->parent_dport)
608 return NULL;
609 return port->parent_dport->port;
610 }
611
unregister_port(void * _port)612 static void unregister_port(void *_port)
613 {
614 struct cxl_port *port = _port;
615 struct cxl_port *parent = parent_port_of(port);
616 struct device *lock_dev;
617
618 /*
619 * CXL root port's and the first level of ports are unregistered
620 * under the platform firmware device lock, all other ports are
621 * unregistered while holding their parent port lock.
622 */
623 if (!parent)
624 lock_dev = port->uport_dev;
625 else if (is_cxl_root(parent))
626 lock_dev = parent->uport_dev;
627 else
628 lock_dev = &parent->dev;
629
630 device_lock_assert(lock_dev);
631 port->dead = true;
632 device_unregister(&port->dev);
633 }
634
cxl_unlink_uport(void * _port)635 static void cxl_unlink_uport(void *_port)
636 {
637 struct cxl_port *port = _port;
638
639 sysfs_remove_link(&port->dev.kobj, "uport");
640 }
641
devm_cxl_link_uport(struct device * host,struct cxl_port * port)642 static int devm_cxl_link_uport(struct device *host, struct cxl_port *port)
643 {
644 int rc;
645
646 rc = sysfs_create_link(&port->dev.kobj, &port->uport_dev->kobj,
647 "uport");
648 if (rc)
649 return rc;
650 return devm_add_action_or_reset(host, cxl_unlink_uport, port);
651 }
652
cxl_unlink_parent_dport(void * _port)653 static void cxl_unlink_parent_dport(void *_port)
654 {
655 struct cxl_port *port = _port;
656
657 sysfs_remove_link(&port->dev.kobj, "parent_dport");
658 }
659
devm_cxl_link_parent_dport(struct device * host,struct cxl_port * port,struct cxl_dport * parent_dport)660 static int devm_cxl_link_parent_dport(struct device *host,
661 struct cxl_port *port,
662 struct cxl_dport *parent_dport)
663 {
664 int rc;
665
666 if (!parent_dport)
667 return 0;
668
669 rc = sysfs_create_link(&port->dev.kobj, &parent_dport->dport_dev->kobj,
670 "parent_dport");
671 if (rc)
672 return rc;
673 return devm_add_action_or_reset(host, cxl_unlink_parent_dport, port);
674 }
675
676 static struct lock_class_key cxl_port_key;
677
cxl_port_alloc(struct device * uport_dev,struct cxl_dport * parent_dport)678 static struct cxl_port *cxl_port_alloc(struct device *uport_dev,
679 struct cxl_dport *parent_dport)
680 {
681 struct cxl_root *cxl_root __free(kfree) = NULL;
682 struct cxl_port *port, *_port __free(kfree) = NULL;
683 struct device *dev;
684 int rc;
685
686 /* No parent_dport, root cxl_port */
687 if (!parent_dport) {
688 cxl_root = kzalloc(sizeof(*cxl_root), GFP_KERNEL);
689 if (!cxl_root)
690 return ERR_PTR(-ENOMEM);
691 } else {
692 _port = kzalloc(sizeof(*port), GFP_KERNEL);
693 if (!_port)
694 return ERR_PTR(-ENOMEM);
695 }
696
697 rc = ida_alloc(&cxl_port_ida, GFP_KERNEL);
698 if (rc < 0)
699 return ERR_PTR(rc);
700
701 if (cxl_root)
702 port = &no_free_ptr(cxl_root)->port;
703 else
704 port = no_free_ptr(_port);
705
706 port->id = rc;
707 port->uport_dev = uport_dev;
708
709 /*
710 * The top-level cxl_port "cxl_root" does not have a cxl_port as
711 * its parent and it does not have any corresponding component
712 * registers as its decode is described by a fixed platform
713 * description.
714 */
715 dev = &port->dev;
716 if (parent_dport) {
717 struct cxl_port *parent_port = parent_dport->port;
718 struct cxl_port *iter;
719
720 dev->parent = &parent_port->dev;
721 port->depth = parent_port->depth + 1;
722 port->parent_dport = parent_dport;
723
724 /*
725 * walk to the host bridge, or the first ancestor that knows
726 * the host bridge
727 */
728 iter = port;
729 while (!iter->host_bridge &&
730 !is_cxl_root(to_cxl_port(iter->dev.parent)))
731 iter = to_cxl_port(iter->dev.parent);
732 if (iter->host_bridge)
733 port->host_bridge = iter->host_bridge;
734 else if (parent_dport->rch)
735 port->host_bridge = parent_dport->dport_dev;
736 else
737 port->host_bridge = iter->uport_dev;
738 dev_dbg(uport_dev, "host-bridge: %s\n",
739 dev_name(port->host_bridge));
740 } else
741 dev->parent = uport_dev;
742
743 ida_init(&port->decoder_ida);
744 port->hdm_end = -1;
745 port->commit_end = -1;
746 xa_init(&port->dports);
747 xa_init(&port->endpoints);
748 xa_init(&port->regions);
749
750 device_initialize(dev);
751 lockdep_set_class_and_subclass(&dev->mutex, &cxl_port_key, port->depth);
752 device_set_pm_not_required(dev);
753 dev->bus = &cxl_bus_type;
754 dev->type = &cxl_port_type;
755
756 return port;
757 }
758
cxl_setup_comp_regs(struct device * host,struct cxl_register_map * map,resource_size_t component_reg_phys)759 static int cxl_setup_comp_regs(struct device *host, struct cxl_register_map *map,
760 resource_size_t component_reg_phys)
761 {
762 *map = (struct cxl_register_map) {
763 .host = host,
764 .reg_type = CXL_REGLOC_RBI_EMPTY,
765 .resource = component_reg_phys,
766 };
767
768 if (component_reg_phys == CXL_RESOURCE_NONE)
769 return 0;
770
771 map->reg_type = CXL_REGLOC_RBI_COMPONENT;
772 map->max_size = CXL_COMPONENT_REG_BLOCK_SIZE;
773
774 return cxl_setup_regs(map);
775 }
776
cxl_port_setup_regs(struct cxl_port * port,resource_size_t component_reg_phys)777 static int cxl_port_setup_regs(struct cxl_port *port,
778 resource_size_t component_reg_phys)
779 {
780 if (dev_is_platform(port->uport_dev))
781 return 0;
782 return cxl_setup_comp_regs(&port->dev, &port->reg_map,
783 component_reg_phys);
784 }
785
cxl_dport_setup_regs(struct device * host,struct cxl_dport * dport,resource_size_t component_reg_phys)786 static int cxl_dport_setup_regs(struct device *host, struct cxl_dport *dport,
787 resource_size_t component_reg_phys)
788 {
789 int rc;
790
791 if (dev_is_platform(dport->dport_dev))
792 return 0;
793
794 /*
795 * use @dport->dport_dev for the context for error messages during
796 * register probing, and fixup @host after the fact, since @host may be
797 * NULL.
798 */
799 rc = cxl_setup_comp_regs(dport->dport_dev, &dport->reg_map,
800 component_reg_phys);
801 dport->reg_map.host = host;
802 return rc;
803 }
804
805 DEFINE_SHOW_ATTRIBUTE(einj_cxl_available_error_type);
806
cxl_einj_inject(void * data,u64 type)807 static int cxl_einj_inject(void *data, u64 type)
808 {
809 struct cxl_dport *dport = data;
810
811 if (dport->rch)
812 return einj_cxl_inject_rch_error(dport->rcrb.base, type);
813
814 return einj_cxl_inject_error(to_pci_dev(dport->dport_dev), type);
815 }
816 DEFINE_DEBUGFS_ATTRIBUTE(cxl_einj_inject_fops, NULL, cxl_einj_inject,
817 "0x%llx\n");
818
cxl_debugfs_create_dport_dir(struct cxl_dport * dport)819 static void cxl_debugfs_create_dport_dir(struct cxl_dport *dport)
820 {
821 struct dentry *dir;
822
823 if (!einj_cxl_is_initialized())
824 return;
825
826 /*
827 * dport_dev needs to be a PCIe port for CXL 2.0+ ports because
828 * EINJ expects a dport SBDF to be specified for 2.0 error injection.
829 */
830 if (!dport->rch && !dev_is_pci(dport->dport_dev))
831 return;
832
833 dir = cxl_debugfs_create_dir(dev_name(dport->dport_dev));
834
835 debugfs_create_file("einj_inject", 0200, dir, dport,
836 &cxl_einj_inject_fops);
837 }
838
cxl_port_add(struct cxl_port * port,resource_size_t component_reg_phys,struct cxl_dport * parent_dport)839 static int cxl_port_add(struct cxl_port *port,
840 resource_size_t component_reg_phys,
841 struct cxl_dport *parent_dport)
842 {
843 struct device *dev __free(put_device) = &port->dev;
844 int rc;
845
846 if (is_cxl_memdev(port->uport_dev)) {
847 struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
848 struct cxl_dev_state *cxlds = cxlmd->cxlds;
849
850 rc = dev_set_name(dev, "endpoint%d", port->id);
851 if (rc)
852 return rc;
853
854 /*
855 * The endpoint driver already enumerated the component and RAS
856 * registers. Reuse that enumeration while prepping them to be
857 * mapped by the cxl_port driver.
858 */
859 port->reg_map = cxlds->reg_map;
860 port->reg_map.host = &port->dev;
861 cxlmd->endpoint = port;
862 } else if (parent_dport) {
863 rc = dev_set_name(dev, "port%d", port->id);
864 if (rc)
865 return rc;
866
867 rc = cxl_port_setup_regs(port, component_reg_phys);
868 if (rc)
869 return rc;
870 } else {
871 rc = dev_set_name(dev, "root%d", port->id);
872 if (rc)
873 return rc;
874 }
875
876 rc = device_add(dev);
877 if (rc)
878 return rc;
879
880 /* Inhibit the cleanup function invoked */
881 dev = NULL;
882 return 0;
883 }
884
__devm_cxl_add_port(struct device * host,struct device * uport_dev,resource_size_t component_reg_phys,struct cxl_dport * parent_dport)885 static struct cxl_port *__devm_cxl_add_port(struct device *host,
886 struct device *uport_dev,
887 resource_size_t component_reg_phys,
888 struct cxl_dport *parent_dport)
889 {
890 struct cxl_port *port;
891 int rc;
892
893 port = cxl_port_alloc(uport_dev, parent_dport);
894 if (IS_ERR(port))
895 return port;
896
897 rc = cxl_port_add(port, component_reg_phys, parent_dport);
898 if (rc)
899 return ERR_PTR(rc);
900
901 rc = devm_add_action_or_reset(host, unregister_port, port);
902 if (rc)
903 return ERR_PTR(rc);
904
905 rc = devm_cxl_link_uport(host, port);
906 if (rc)
907 return ERR_PTR(rc);
908
909 rc = devm_cxl_link_parent_dport(host, port, parent_dport);
910 if (rc)
911 return ERR_PTR(rc);
912
913 if (parent_dport && dev_is_pci(uport_dev))
914 port->pci_latency = cxl_pci_get_latency(to_pci_dev(uport_dev));
915
916 return port;
917 }
918
919 /**
920 * devm_cxl_add_port - register a cxl_port in CXL memory decode hierarchy
921 * @host: host device for devm operations
922 * @uport_dev: "physical" device implementing this upstream port
923 * @component_reg_phys: (optional) for configurable cxl_port instances
924 * @parent_dport: next hop up in the CXL memory decode hierarchy
925 */
devm_cxl_add_port(struct device * host,struct device * uport_dev,resource_size_t component_reg_phys,struct cxl_dport * parent_dport)926 struct cxl_port *devm_cxl_add_port(struct device *host,
927 struct device *uport_dev,
928 resource_size_t component_reg_phys,
929 struct cxl_dport *parent_dport)
930 {
931 struct cxl_port *port, *parent_port;
932
933 port = __devm_cxl_add_port(host, uport_dev, component_reg_phys,
934 parent_dport);
935
936 parent_port = parent_dport ? parent_dport->port : NULL;
937 if (IS_ERR(port)) {
938 dev_dbg(uport_dev, "Failed to add%s%s%s: %ld\n",
939 parent_port ? " port to " : "",
940 parent_port ? dev_name(&parent_port->dev) : "",
941 parent_port ? "" : " root port",
942 PTR_ERR(port));
943 } else {
944 dev_dbg(uport_dev, "%s added%s%s%s\n",
945 dev_name(&port->dev),
946 parent_port ? " to " : "",
947 parent_port ? dev_name(&parent_port->dev) : "",
948 parent_port ? "" : " (root port)");
949 }
950
951 return port;
952 }
953 EXPORT_SYMBOL_NS_GPL(devm_cxl_add_port, "CXL");
954
devm_cxl_add_root(struct device * host,const struct cxl_root_ops * ops)955 struct cxl_root *devm_cxl_add_root(struct device *host,
956 const struct cxl_root_ops *ops)
957 {
958 struct cxl_root *cxl_root;
959 struct cxl_port *port;
960
961 port = devm_cxl_add_port(host, host, CXL_RESOURCE_NONE, NULL);
962 if (IS_ERR(port))
963 return ERR_CAST(port);
964
965 cxl_root = to_cxl_root(port);
966 cxl_root->ops = ops;
967 return cxl_root;
968 }
969 EXPORT_SYMBOL_NS_GPL(devm_cxl_add_root, "CXL");
970
cxl_port_to_pci_bus(struct cxl_port * port)971 struct pci_bus *cxl_port_to_pci_bus(struct cxl_port *port)
972 {
973 /* There is no pci_bus associated with a CXL platform-root port */
974 if (is_cxl_root(port))
975 return NULL;
976
977 if (dev_is_pci(port->uport_dev)) {
978 struct pci_dev *pdev = to_pci_dev(port->uport_dev);
979
980 return pdev->subordinate;
981 }
982
983 return xa_load(&cxl_root_buses, (unsigned long)port->uport_dev);
984 }
985 EXPORT_SYMBOL_NS_GPL(cxl_port_to_pci_bus, "CXL");
986
unregister_pci_bus(void * uport_dev)987 static void unregister_pci_bus(void *uport_dev)
988 {
989 xa_erase(&cxl_root_buses, (unsigned long)uport_dev);
990 }
991
devm_cxl_register_pci_bus(struct device * host,struct device * uport_dev,struct pci_bus * bus)992 int devm_cxl_register_pci_bus(struct device *host, struct device *uport_dev,
993 struct pci_bus *bus)
994 {
995 int rc;
996
997 if (dev_is_pci(uport_dev))
998 return -EINVAL;
999
1000 rc = xa_insert(&cxl_root_buses, (unsigned long)uport_dev, bus,
1001 GFP_KERNEL);
1002 if (rc)
1003 return rc;
1004 return devm_add_action_or_reset(host, unregister_pci_bus, uport_dev);
1005 }
1006 EXPORT_SYMBOL_NS_GPL(devm_cxl_register_pci_bus, "CXL");
1007
dev_is_cxl_root_child(struct device * dev)1008 static bool dev_is_cxl_root_child(struct device *dev)
1009 {
1010 struct cxl_port *port, *parent;
1011
1012 if (!is_cxl_port(dev))
1013 return false;
1014
1015 port = to_cxl_port(dev);
1016 if (is_cxl_root(port))
1017 return false;
1018
1019 parent = to_cxl_port(port->dev.parent);
1020 if (is_cxl_root(parent))
1021 return true;
1022
1023 return false;
1024 }
1025
find_cxl_root(struct cxl_port * port)1026 struct cxl_root *find_cxl_root(struct cxl_port *port)
1027 {
1028 struct cxl_port *iter = port;
1029
1030 while (iter && !is_cxl_root(iter))
1031 iter = to_cxl_port(iter->dev.parent);
1032
1033 if (!iter)
1034 return NULL;
1035 get_device(&iter->dev);
1036 return to_cxl_root(iter);
1037 }
1038 EXPORT_SYMBOL_NS_GPL(find_cxl_root, "CXL");
1039
find_dport(struct cxl_port * port,int id)1040 static struct cxl_dport *find_dport(struct cxl_port *port, int id)
1041 {
1042 struct cxl_dport *dport;
1043 unsigned long index;
1044
1045 device_lock_assert(&port->dev);
1046 xa_for_each(&port->dports, index, dport)
1047 if (dport->port_id == id)
1048 return dport;
1049 return NULL;
1050 }
1051
add_dport(struct cxl_port * port,struct cxl_dport * dport)1052 static int add_dport(struct cxl_port *port, struct cxl_dport *dport)
1053 {
1054 struct cxl_dport *dup;
1055 int rc;
1056
1057 device_lock_assert(&port->dev);
1058 dup = find_dport(port, dport->port_id);
1059 if (dup) {
1060 dev_err(&port->dev,
1061 "unable to add dport%d-%s non-unique port id (%s)\n",
1062 dport->port_id, dev_name(dport->dport_dev),
1063 dev_name(dup->dport_dev));
1064 return -EBUSY;
1065 }
1066
1067 rc = xa_insert(&port->dports, (unsigned long)dport->dport_dev, dport,
1068 GFP_KERNEL);
1069 if (rc)
1070 return rc;
1071
1072 port->nr_dports++;
1073 return 0;
1074 }
1075
1076 /*
1077 * Since root-level CXL dports cannot be enumerated by PCI they are not
1078 * enumerated by the common port driver that acquires the port lock over
1079 * dport add/remove. Instead, root dports are manually added by a
1080 * platform driver and cond_cxl_root_lock() is used to take the missing
1081 * port lock in that case.
1082 */
cond_cxl_root_lock(struct cxl_port * port)1083 static void cond_cxl_root_lock(struct cxl_port *port)
1084 {
1085 if (is_cxl_root(port))
1086 device_lock(&port->dev);
1087 }
1088
cond_cxl_root_unlock(struct cxl_port * port)1089 static void cond_cxl_root_unlock(struct cxl_port *port)
1090 {
1091 if (is_cxl_root(port))
1092 device_unlock(&port->dev);
1093 }
1094
cxl_dport_remove(void * data)1095 static void cxl_dport_remove(void *data)
1096 {
1097 struct cxl_dport *dport = data;
1098 struct cxl_port *port = dport->port;
1099
1100 xa_erase(&port->dports, (unsigned long) dport->dport_dev);
1101 put_device(dport->dport_dev);
1102 }
1103
cxl_dport_unlink(void * data)1104 static void cxl_dport_unlink(void *data)
1105 {
1106 struct cxl_dport *dport = data;
1107 struct cxl_port *port = dport->port;
1108 char link_name[CXL_TARGET_STRLEN];
1109
1110 sprintf(link_name, "dport%d", dport->port_id);
1111 sysfs_remove_link(&port->dev.kobj, link_name);
1112 }
1113
1114 static struct cxl_dport *
__devm_cxl_add_dport(struct cxl_port * port,struct device * dport_dev,int port_id,resource_size_t component_reg_phys,resource_size_t rcrb)1115 __devm_cxl_add_dport(struct cxl_port *port, struct device *dport_dev,
1116 int port_id, resource_size_t component_reg_phys,
1117 resource_size_t rcrb)
1118 {
1119 char link_name[CXL_TARGET_STRLEN];
1120 struct cxl_dport *dport;
1121 struct device *host;
1122 int rc;
1123
1124 if (is_cxl_root(port))
1125 host = port->uport_dev;
1126 else
1127 host = &port->dev;
1128
1129 if (!host->driver) {
1130 dev_WARN_ONCE(&port->dev, 1, "dport:%s bad devm context\n",
1131 dev_name(dport_dev));
1132 return ERR_PTR(-ENXIO);
1133 }
1134
1135 if (snprintf(link_name, CXL_TARGET_STRLEN, "dport%d", port_id) >=
1136 CXL_TARGET_STRLEN)
1137 return ERR_PTR(-EINVAL);
1138
1139 dport = devm_kzalloc(host, sizeof(*dport), GFP_KERNEL);
1140 if (!dport)
1141 return ERR_PTR(-ENOMEM);
1142
1143 dport->dport_dev = dport_dev;
1144 dport->port_id = port_id;
1145 dport->port = port;
1146
1147 if (rcrb == CXL_RESOURCE_NONE) {
1148 rc = cxl_dport_setup_regs(&port->dev, dport,
1149 component_reg_phys);
1150 if (rc)
1151 return ERR_PTR(rc);
1152 } else {
1153 dport->rcrb.base = rcrb;
1154 component_reg_phys = __rcrb_to_component(dport_dev, &dport->rcrb,
1155 CXL_RCRB_DOWNSTREAM);
1156 if (component_reg_phys == CXL_RESOURCE_NONE) {
1157 dev_warn(dport_dev, "Invalid Component Registers in RCRB");
1158 return ERR_PTR(-ENXIO);
1159 }
1160
1161 /*
1162 * RCH @dport is not ready to map until associated with its
1163 * memdev
1164 */
1165 rc = cxl_dport_setup_regs(NULL, dport, component_reg_phys);
1166 if (rc)
1167 return ERR_PTR(rc);
1168
1169 dport->rch = true;
1170 }
1171
1172 if (component_reg_phys != CXL_RESOURCE_NONE)
1173 dev_dbg(dport_dev, "Component Registers found for dport: %pa\n",
1174 &component_reg_phys);
1175
1176 cond_cxl_root_lock(port);
1177 rc = add_dport(port, dport);
1178 cond_cxl_root_unlock(port);
1179 if (rc)
1180 return ERR_PTR(rc);
1181
1182 get_device(dport_dev);
1183 rc = devm_add_action_or_reset(host, cxl_dport_remove, dport);
1184 if (rc)
1185 return ERR_PTR(rc);
1186
1187 rc = sysfs_create_link(&port->dev.kobj, &dport_dev->kobj, link_name);
1188 if (rc)
1189 return ERR_PTR(rc);
1190
1191 rc = devm_add_action_or_reset(host, cxl_dport_unlink, dport);
1192 if (rc)
1193 return ERR_PTR(rc);
1194
1195 if (dev_is_pci(dport_dev))
1196 dport->link_latency = cxl_pci_get_latency(to_pci_dev(dport_dev));
1197
1198 cxl_debugfs_create_dport_dir(dport);
1199
1200 return dport;
1201 }
1202
1203 /**
1204 * devm_cxl_add_dport - append VH downstream port data to a cxl_port
1205 * @port: the cxl_port that references this dport
1206 * @dport_dev: firmware or PCI device representing the dport
1207 * @port_id: identifier for this dport in a decoder's target list
1208 * @component_reg_phys: optional location of CXL component registers
1209 *
1210 * Note that dports are appended to the devm release action's of the
1211 * either the port's host (for root ports), or the port itself (for
1212 * switch ports)
1213 */
devm_cxl_add_dport(struct cxl_port * port,struct device * dport_dev,int port_id,resource_size_t component_reg_phys)1214 struct cxl_dport *devm_cxl_add_dport(struct cxl_port *port,
1215 struct device *dport_dev, int port_id,
1216 resource_size_t component_reg_phys)
1217 {
1218 struct cxl_dport *dport;
1219
1220 dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1221 component_reg_phys, CXL_RESOURCE_NONE);
1222 if (IS_ERR(dport)) {
1223 dev_dbg(dport_dev, "failed to add dport to %s: %ld\n",
1224 dev_name(&port->dev), PTR_ERR(dport));
1225 } else {
1226 dev_dbg(dport_dev, "dport added to %s\n",
1227 dev_name(&port->dev));
1228 }
1229
1230 return dport;
1231 }
1232 EXPORT_SYMBOL_NS_GPL(devm_cxl_add_dport, "CXL");
1233
1234 /**
1235 * devm_cxl_add_rch_dport - append RCH downstream port data to a cxl_port
1236 * @port: the cxl_port that references this dport
1237 * @dport_dev: firmware or PCI device representing the dport
1238 * @port_id: identifier for this dport in a decoder's target list
1239 * @rcrb: mandatory location of a Root Complex Register Block
1240 *
1241 * See CXL 3.0 9.11.8 CXL Devices Attached to an RCH
1242 */
devm_cxl_add_rch_dport(struct cxl_port * port,struct device * dport_dev,int port_id,resource_size_t rcrb)1243 struct cxl_dport *devm_cxl_add_rch_dport(struct cxl_port *port,
1244 struct device *dport_dev, int port_id,
1245 resource_size_t rcrb)
1246 {
1247 struct cxl_dport *dport;
1248
1249 if (rcrb == CXL_RESOURCE_NONE) {
1250 dev_dbg(&port->dev, "failed to add RCH dport, missing RCRB\n");
1251 return ERR_PTR(-EINVAL);
1252 }
1253
1254 dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1255 CXL_RESOURCE_NONE, rcrb);
1256 if (IS_ERR(dport)) {
1257 dev_dbg(dport_dev, "failed to add RCH dport to %s: %ld\n",
1258 dev_name(&port->dev), PTR_ERR(dport));
1259 } else {
1260 dev_dbg(dport_dev, "RCH dport added to %s\n",
1261 dev_name(&port->dev));
1262 }
1263
1264 return dport;
1265 }
1266 EXPORT_SYMBOL_NS_GPL(devm_cxl_add_rch_dport, "CXL");
1267
add_ep(struct cxl_ep * new)1268 static int add_ep(struct cxl_ep *new)
1269 {
1270 struct cxl_port *port = new->dport->port;
1271
1272 guard(device)(&port->dev);
1273 if (port->dead)
1274 return -ENXIO;
1275
1276 return xa_insert(&port->endpoints, (unsigned long)new->ep,
1277 new, GFP_KERNEL);
1278 }
1279
1280 /**
1281 * cxl_add_ep - register an endpoint's interest in a port
1282 * @dport: the dport that routes to @ep_dev
1283 * @ep_dev: device representing the endpoint
1284 *
1285 * Intermediate CXL ports are scanned based on the arrival of endpoints.
1286 * When those endpoints depart the port can be destroyed once all
1287 * endpoints that care about that port have been removed.
1288 */
cxl_add_ep(struct cxl_dport * dport,struct device * ep_dev)1289 static int cxl_add_ep(struct cxl_dport *dport, struct device *ep_dev)
1290 {
1291 struct cxl_ep *ep;
1292 int rc;
1293
1294 ep = kzalloc(sizeof(*ep), GFP_KERNEL);
1295 if (!ep)
1296 return -ENOMEM;
1297
1298 ep->ep = get_device(ep_dev);
1299 ep->dport = dport;
1300
1301 rc = add_ep(ep);
1302 if (rc)
1303 cxl_ep_release(ep);
1304 return rc;
1305 }
1306
1307 struct cxl_find_port_ctx {
1308 const struct device *dport_dev;
1309 const struct cxl_port *parent_port;
1310 struct cxl_dport **dport;
1311 };
1312
match_port_by_dport(struct device * dev,const void * data)1313 static int match_port_by_dport(struct device *dev, const void *data)
1314 {
1315 const struct cxl_find_port_ctx *ctx = data;
1316 struct cxl_dport *dport;
1317 struct cxl_port *port;
1318
1319 if (!is_cxl_port(dev))
1320 return 0;
1321 if (ctx->parent_port && dev->parent != &ctx->parent_port->dev)
1322 return 0;
1323
1324 port = to_cxl_port(dev);
1325 dport = cxl_find_dport_by_dev(port, ctx->dport_dev);
1326 if (ctx->dport)
1327 *ctx->dport = dport;
1328 return dport != NULL;
1329 }
1330
__find_cxl_port(struct cxl_find_port_ctx * ctx)1331 static struct cxl_port *__find_cxl_port(struct cxl_find_port_ctx *ctx)
1332 {
1333 struct device *dev;
1334
1335 if (!ctx->dport_dev)
1336 return NULL;
1337
1338 dev = bus_find_device(&cxl_bus_type, NULL, ctx, match_port_by_dport);
1339 if (dev)
1340 return to_cxl_port(dev);
1341 return NULL;
1342 }
1343
find_cxl_port(struct device * dport_dev,struct cxl_dport ** dport)1344 static struct cxl_port *find_cxl_port(struct device *dport_dev,
1345 struct cxl_dport **dport)
1346 {
1347 struct cxl_find_port_ctx ctx = {
1348 .dport_dev = dport_dev,
1349 .dport = dport,
1350 };
1351 struct cxl_port *port;
1352
1353 port = __find_cxl_port(&ctx);
1354 return port;
1355 }
1356
find_cxl_port_at(struct cxl_port * parent_port,struct device * dport_dev,struct cxl_dport ** dport)1357 static struct cxl_port *find_cxl_port_at(struct cxl_port *parent_port,
1358 struct device *dport_dev,
1359 struct cxl_dport **dport)
1360 {
1361 struct cxl_find_port_ctx ctx = {
1362 .dport_dev = dport_dev,
1363 .parent_port = parent_port,
1364 .dport = dport,
1365 };
1366 struct cxl_port *port;
1367
1368 port = __find_cxl_port(&ctx);
1369 return port;
1370 }
1371
1372 /*
1373 * All users of grandparent() are using it to walk PCIe-like switch port
1374 * hierarchy. A PCIe switch is comprised of a bridge device representing the
1375 * upstream switch port and N bridges representing downstream switch ports. When
1376 * bridges stack the grand-parent of a downstream switch port is another
1377 * downstream switch port in the immediate ancestor switch.
1378 */
grandparent(struct device * dev)1379 static struct device *grandparent(struct device *dev)
1380 {
1381 if (dev && dev->parent)
1382 return dev->parent->parent;
1383 return NULL;
1384 }
1385
endpoint_host(struct cxl_port * endpoint)1386 static struct device *endpoint_host(struct cxl_port *endpoint)
1387 {
1388 struct cxl_port *port = to_cxl_port(endpoint->dev.parent);
1389
1390 if (is_cxl_root(port))
1391 return port->uport_dev;
1392 return &port->dev;
1393 }
1394
delete_endpoint(void * data)1395 static void delete_endpoint(void *data)
1396 {
1397 struct cxl_memdev *cxlmd = data;
1398 struct cxl_port *endpoint = cxlmd->endpoint;
1399 struct device *host = endpoint_host(endpoint);
1400
1401 scoped_guard(device, host) {
1402 if (host->driver && !endpoint->dead) {
1403 devm_release_action(host, cxl_unlink_parent_dport, endpoint);
1404 devm_release_action(host, cxl_unlink_uport, endpoint);
1405 devm_release_action(host, unregister_port, endpoint);
1406 }
1407 cxlmd->endpoint = NULL;
1408 }
1409 put_device(&endpoint->dev);
1410 put_device(host);
1411 }
1412
cxl_endpoint_autoremove(struct cxl_memdev * cxlmd,struct cxl_port * endpoint)1413 int cxl_endpoint_autoremove(struct cxl_memdev *cxlmd, struct cxl_port *endpoint)
1414 {
1415 struct device *host = endpoint_host(endpoint);
1416 struct device *dev = &cxlmd->dev;
1417
1418 get_device(host);
1419 get_device(&endpoint->dev);
1420 cxlmd->depth = endpoint->depth;
1421 return devm_add_action_or_reset(dev, delete_endpoint, cxlmd);
1422 }
1423 EXPORT_SYMBOL_NS_GPL(cxl_endpoint_autoremove, "CXL");
1424
1425 /*
1426 * The natural end of life of a non-root 'cxl_port' is when its parent port goes
1427 * through a ->remove() event ("top-down" unregistration). The unnatural trigger
1428 * for a port to be unregistered is when all memdevs beneath that port have gone
1429 * through ->remove(). This "bottom-up" removal selectively removes individual
1430 * child ports manually. This depends on devm_cxl_add_port() to not change is
1431 * devm action registration order, and for dports to have already been
1432 * destroyed by reap_dports().
1433 */
delete_switch_port(struct cxl_port * port)1434 static void delete_switch_port(struct cxl_port *port)
1435 {
1436 devm_release_action(port->dev.parent, cxl_unlink_parent_dport, port);
1437 devm_release_action(port->dev.parent, cxl_unlink_uport, port);
1438 devm_release_action(port->dev.parent, unregister_port, port);
1439 }
1440
reap_dports(struct cxl_port * port)1441 static void reap_dports(struct cxl_port *port)
1442 {
1443 struct cxl_dport *dport;
1444 unsigned long index;
1445
1446 device_lock_assert(&port->dev);
1447
1448 xa_for_each(&port->dports, index, dport) {
1449 devm_release_action(&port->dev, cxl_dport_unlink, dport);
1450 devm_release_action(&port->dev, cxl_dport_remove, dport);
1451 devm_kfree(&port->dev, dport);
1452 }
1453 }
1454
1455 struct detach_ctx {
1456 struct cxl_memdev *cxlmd;
1457 int depth;
1458 };
1459
port_has_memdev(struct device * dev,const void * data)1460 static int port_has_memdev(struct device *dev, const void *data)
1461 {
1462 const struct detach_ctx *ctx = data;
1463 struct cxl_port *port;
1464
1465 if (!is_cxl_port(dev))
1466 return 0;
1467
1468 port = to_cxl_port(dev);
1469 if (port->depth != ctx->depth)
1470 return 0;
1471
1472 return !!cxl_ep_load(port, ctx->cxlmd);
1473 }
1474
cxl_detach_ep(void * data)1475 static void cxl_detach_ep(void *data)
1476 {
1477 struct cxl_memdev *cxlmd = data;
1478
1479 for (int i = cxlmd->depth - 1; i >= 1; i--) {
1480 struct cxl_port *port, *parent_port;
1481 struct detach_ctx ctx = {
1482 .cxlmd = cxlmd,
1483 .depth = i,
1484 };
1485 struct cxl_ep *ep;
1486 bool died = false;
1487
1488 struct device *dev __free(put_device) =
1489 bus_find_device(&cxl_bus_type, NULL, &ctx, port_has_memdev);
1490 if (!dev)
1491 continue;
1492 port = to_cxl_port(dev);
1493
1494 parent_port = to_cxl_port(port->dev.parent);
1495 device_lock(&parent_port->dev);
1496 device_lock(&port->dev);
1497 ep = cxl_ep_load(port, cxlmd);
1498 dev_dbg(&cxlmd->dev, "disconnect %s from %s\n",
1499 ep ? dev_name(ep->ep) : "", dev_name(&port->dev));
1500 cxl_ep_remove(port, ep);
1501 if (ep && !port->dead && xa_empty(&port->endpoints) &&
1502 !is_cxl_root(parent_port) && parent_port->dev.driver) {
1503 /*
1504 * This was the last ep attached to a dynamically
1505 * enumerated port. Block new cxl_add_ep() and garbage
1506 * collect the port.
1507 */
1508 died = true;
1509 port->dead = true;
1510 reap_dports(port);
1511 }
1512 device_unlock(&port->dev);
1513
1514 if (died) {
1515 dev_dbg(&cxlmd->dev, "delete %s\n",
1516 dev_name(&port->dev));
1517 delete_switch_port(port);
1518 }
1519 device_unlock(&parent_port->dev);
1520 }
1521 }
1522
find_component_registers(struct device * dev)1523 static resource_size_t find_component_registers(struct device *dev)
1524 {
1525 struct cxl_register_map map;
1526 struct pci_dev *pdev;
1527
1528 /*
1529 * Theoretically, CXL component registers can be hosted on a
1530 * non-PCI device, in practice, only cxl_test hits this case.
1531 */
1532 if (!dev_is_pci(dev))
1533 return CXL_RESOURCE_NONE;
1534
1535 pdev = to_pci_dev(dev);
1536
1537 cxl_find_regblock(pdev, CXL_REGLOC_RBI_COMPONENT, &map);
1538 return map.resource;
1539 }
1540
add_port_attach_ep(struct cxl_memdev * cxlmd,struct device * uport_dev,struct device * dport_dev)1541 static int add_port_attach_ep(struct cxl_memdev *cxlmd,
1542 struct device *uport_dev,
1543 struct device *dport_dev)
1544 {
1545 struct device *dparent = grandparent(dport_dev);
1546 struct cxl_dport *dport, *parent_dport;
1547 resource_size_t component_reg_phys;
1548 int rc;
1549
1550 if (!dparent) {
1551 /*
1552 * The iteration reached the topology root without finding the
1553 * CXL-root 'cxl_port' on a previous iteration, fail for now to
1554 * be re-probed after platform driver attaches.
1555 */
1556 dev_dbg(&cxlmd->dev, "%s is a root dport\n",
1557 dev_name(dport_dev));
1558 return -ENXIO;
1559 }
1560
1561 struct cxl_port *parent_port __free(put_cxl_port) =
1562 find_cxl_port(dparent, &parent_dport);
1563 if (!parent_port) {
1564 /* iterate to create this parent_port */
1565 return -EAGAIN;
1566 }
1567
1568 /*
1569 * Definition with __free() here to keep the sequence of
1570 * dereferencing the device of the port before the parent_port releasing.
1571 */
1572 struct cxl_port *port __free(put_cxl_port) = NULL;
1573 scoped_guard(device, &parent_port->dev) {
1574 if (!parent_port->dev.driver) {
1575 dev_warn(&cxlmd->dev,
1576 "port %s:%s disabled, failed to enumerate CXL.mem\n",
1577 dev_name(&parent_port->dev), dev_name(uport_dev));
1578 return -ENXIO;
1579 }
1580
1581 port = find_cxl_port_at(parent_port, dport_dev, &dport);
1582 if (!port) {
1583 component_reg_phys = find_component_registers(uport_dev);
1584 port = devm_cxl_add_port(&parent_port->dev, uport_dev,
1585 component_reg_phys, parent_dport);
1586 if (IS_ERR(port))
1587 return PTR_ERR(port);
1588
1589 /* retry find to pick up the new dport information */
1590 port = find_cxl_port_at(parent_port, dport_dev, &dport);
1591 if (!port)
1592 return -ENXIO;
1593 }
1594 }
1595
1596 dev_dbg(&cxlmd->dev, "add to new port %s:%s\n",
1597 dev_name(&port->dev), dev_name(port->uport_dev));
1598 rc = cxl_add_ep(dport, &cxlmd->dev);
1599 if (rc == -EBUSY) {
1600 /*
1601 * "can't" happen, but this error code means
1602 * something to the caller, so translate it.
1603 */
1604 rc = -ENXIO;
1605 }
1606
1607 return rc;
1608 }
1609
devm_cxl_enumerate_ports(struct cxl_memdev * cxlmd)1610 int devm_cxl_enumerate_ports(struct cxl_memdev *cxlmd)
1611 {
1612 struct device *dev = &cxlmd->dev;
1613 struct device *iter;
1614 int rc;
1615
1616 /*
1617 * Skip intermediate port enumeration in the RCH case, there
1618 * are no ports in between a host bridge and an endpoint.
1619 */
1620 if (cxlmd->cxlds->rcd)
1621 return 0;
1622
1623 rc = devm_add_action_or_reset(&cxlmd->dev, cxl_detach_ep, cxlmd);
1624 if (rc)
1625 return rc;
1626
1627 /*
1628 * Scan for and add all cxl_ports in this device's ancestry.
1629 * Repeat until no more ports are added. Abort if a port add
1630 * attempt fails.
1631 */
1632 retry:
1633 for (iter = dev; iter; iter = grandparent(iter)) {
1634 struct device *dport_dev = grandparent(iter);
1635 struct device *uport_dev;
1636 struct cxl_dport *dport;
1637
1638 /*
1639 * The terminal "grandparent" in PCI is NULL and @platform_bus
1640 * for platform devices
1641 */
1642 if (!dport_dev || dport_dev == &platform_bus)
1643 return 0;
1644
1645 uport_dev = dport_dev->parent;
1646 if (!uport_dev) {
1647 dev_warn(dev, "at %s no parent for dport: %s\n",
1648 dev_name(iter), dev_name(dport_dev));
1649 return -ENXIO;
1650 }
1651
1652 dev_dbg(dev, "scan: iter: %s dport_dev: %s parent: %s\n",
1653 dev_name(iter), dev_name(dport_dev),
1654 dev_name(uport_dev));
1655 struct cxl_port *port __free(put_cxl_port) =
1656 find_cxl_port(dport_dev, &dport);
1657 if (port) {
1658 dev_dbg(&cxlmd->dev,
1659 "found already registered port %s:%s\n",
1660 dev_name(&port->dev),
1661 dev_name(port->uport_dev));
1662 rc = cxl_add_ep(dport, &cxlmd->dev);
1663
1664 /*
1665 * If the endpoint already exists in the port's list,
1666 * that's ok, it was added on a previous pass.
1667 * Otherwise, retry in add_port_attach_ep() after taking
1668 * the parent_port lock as the current port may be being
1669 * reaped.
1670 */
1671 if (rc && rc != -EBUSY)
1672 return rc;
1673
1674 cxl_gpf_port_setup(dport);
1675
1676 /* Any more ports to add between this one and the root? */
1677 if (!dev_is_cxl_root_child(&port->dev))
1678 continue;
1679
1680 return 0;
1681 }
1682
1683 rc = add_port_attach_ep(cxlmd, uport_dev, dport_dev);
1684 /* port missing, try to add parent */
1685 if (rc == -EAGAIN)
1686 continue;
1687 /* failed to add ep or port */
1688 if (rc)
1689 return rc;
1690 /* port added, new descendants possible, start over */
1691 goto retry;
1692 }
1693
1694 return 0;
1695 }
1696 EXPORT_SYMBOL_NS_GPL(devm_cxl_enumerate_ports, "CXL");
1697
cxl_pci_find_port(struct pci_dev * pdev,struct cxl_dport ** dport)1698 struct cxl_port *cxl_pci_find_port(struct pci_dev *pdev,
1699 struct cxl_dport **dport)
1700 {
1701 return find_cxl_port(pdev->dev.parent, dport);
1702 }
1703 EXPORT_SYMBOL_NS_GPL(cxl_pci_find_port, "CXL");
1704
cxl_mem_find_port(struct cxl_memdev * cxlmd,struct cxl_dport ** dport)1705 struct cxl_port *cxl_mem_find_port(struct cxl_memdev *cxlmd,
1706 struct cxl_dport **dport)
1707 {
1708 return find_cxl_port(grandparent(&cxlmd->dev), dport);
1709 }
1710 EXPORT_SYMBOL_NS_GPL(cxl_mem_find_port, "CXL");
1711
decoder_populate_targets(struct cxl_switch_decoder * cxlsd,struct cxl_port * port,int * target_map)1712 static int decoder_populate_targets(struct cxl_switch_decoder *cxlsd,
1713 struct cxl_port *port, int *target_map)
1714 {
1715 int i;
1716
1717 if (!target_map)
1718 return 0;
1719
1720 device_lock_assert(&port->dev);
1721
1722 if (xa_empty(&port->dports))
1723 return -EINVAL;
1724
1725 guard(rwsem_write)(&cxl_region_rwsem);
1726 for (i = 0; i < cxlsd->cxld.interleave_ways; i++) {
1727 struct cxl_dport *dport = find_dport(port, target_map[i]);
1728
1729 if (!dport)
1730 return -ENXIO;
1731 cxlsd->target[i] = dport;
1732 }
1733
1734 return 0;
1735 }
1736
1737 static struct lock_class_key cxl_decoder_key;
1738
1739 /**
1740 * cxl_decoder_init - Common decoder setup / initialization
1741 * @port: owning port of this decoder
1742 * @cxld: common decoder properties to initialize
1743 *
1744 * A port may contain one or more decoders. Each of those decoders
1745 * enable some address space for CXL.mem utilization. A decoder is
1746 * expected to be configured by the caller before registering via
1747 * cxl_decoder_add()
1748 */
cxl_decoder_init(struct cxl_port * port,struct cxl_decoder * cxld)1749 static int cxl_decoder_init(struct cxl_port *port, struct cxl_decoder *cxld)
1750 {
1751 struct device *dev;
1752 int rc;
1753
1754 rc = ida_alloc(&port->decoder_ida, GFP_KERNEL);
1755 if (rc < 0)
1756 return rc;
1757
1758 /* need parent to stick around to release the id */
1759 get_device(&port->dev);
1760 cxld->id = rc;
1761
1762 dev = &cxld->dev;
1763 device_initialize(dev);
1764 lockdep_set_class(&dev->mutex, &cxl_decoder_key);
1765 device_set_pm_not_required(dev);
1766 dev->parent = &port->dev;
1767 dev->bus = &cxl_bus_type;
1768
1769 /* Pre initialize an "empty" decoder */
1770 cxld->interleave_ways = 1;
1771 cxld->interleave_granularity = PAGE_SIZE;
1772 cxld->target_type = CXL_DECODER_HOSTONLYMEM;
1773 cxld->hpa_range = (struct range) {
1774 .start = 0,
1775 .end = -1,
1776 };
1777
1778 return 0;
1779 }
1780
cxl_switch_decoder_init(struct cxl_port * port,struct cxl_switch_decoder * cxlsd,int nr_targets)1781 static int cxl_switch_decoder_init(struct cxl_port *port,
1782 struct cxl_switch_decoder *cxlsd,
1783 int nr_targets)
1784 {
1785 if (nr_targets > CXL_DECODER_MAX_INTERLEAVE)
1786 return -EINVAL;
1787
1788 cxlsd->nr_targets = nr_targets;
1789 return cxl_decoder_init(port, &cxlsd->cxld);
1790 }
1791
1792 /**
1793 * cxl_root_decoder_alloc - Allocate a root level decoder
1794 * @port: owning CXL root of this decoder
1795 * @nr_targets: static number of downstream targets
1796 *
1797 * Return: A new cxl decoder to be registered by cxl_decoder_add(). A
1798 * 'CXL root' decoder is one that decodes from a top-level / static platform
1799 * firmware description of CXL resources into a CXL standard decode
1800 * topology.
1801 */
cxl_root_decoder_alloc(struct cxl_port * port,unsigned int nr_targets)1802 struct cxl_root_decoder *cxl_root_decoder_alloc(struct cxl_port *port,
1803 unsigned int nr_targets)
1804 {
1805 struct cxl_root_decoder *cxlrd;
1806 struct cxl_switch_decoder *cxlsd;
1807 struct cxl_decoder *cxld;
1808 int rc;
1809
1810 if (!is_cxl_root(port))
1811 return ERR_PTR(-EINVAL);
1812
1813 cxlrd = kzalloc(struct_size(cxlrd, cxlsd.target, nr_targets),
1814 GFP_KERNEL);
1815 if (!cxlrd)
1816 return ERR_PTR(-ENOMEM);
1817
1818 cxlsd = &cxlrd->cxlsd;
1819 rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
1820 if (rc) {
1821 kfree(cxlrd);
1822 return ERR_PTR(rc);
1823 }
1824
1825 mutex_init(&cxlrd->range_lock);
1826
1827 cxld = &cxlsd->cxld;
1828 cxld->dev.type = &cxl_decoder_root_type;
1829 /*
1830 * cxl_root_decoder_release() special cases negative ids to
1831 * detect memregion_alloc() failures.
1832 */
1833 atomic_set(&cxlrd->region_id, -1);
1834 rc = memregion_alloc(GFP_KERNEL);
1835 if (rc < 0) {
1836 put_device(&cxld->dev);
1837 return ERR_PTR(rc);
1838 }
1839
1840 atomic_set(&cxlrd->region_id, rc);
1841 cxlrd->qos_class = CXL_QOS_CLASS_INVALID;
1842 return cxlrd;
1843 }
1844 EXPORT_SYMBOL_NS_GPL(cxl_root_decoder_alloc, "CXL");
1845
1846 /**
1847 * cxl_switch_decoder_alloc - Allocate a switch level decoder
1848 * @port: owning CXL switch port of this decoder
1849 * @nr_targets: max number of dynamically addressable downstream targets
1850 *
1851 * Return: A new cxl decoder to be registered by cxl_decoder_add(). A
1852 * 'switch' decoder is any decoder that can be enumerated by PCIe
1853 * topology and the HDM Decoder Capability. This includes the decoders
1854 * that sit between Switch Upstream Ports / Switch Downstream Ports and
1855 * Host Bridges / Root Ports.
1856 */
cxl_switch_decoder_alloc(struct cxl_port * port,unsigned int nr_targets)1857 struct cxl_switch_decoder *cxl_switch_decoder_alloc(struct cxl_port *port,
1858 unsigned int nr_targets)
1859 {
1860 struct cxl_switch_decoder *cxlsd;
1861 struct cxl_decoder *cxld;
1862 int rc;
1863
1864 if (is_cxl_root(port) || is_cxl_endpoint(port))
1865 return ERR_PTR(-EINVAL);
1866
1867 cxlsd = kzalloc(struct_size(cxlsd, target, nr_targets), GFP_KERNEL);
1868 if (!cxlsd)
1869 return ERR_PTR(-ENOMEM);
1870
1871 rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
1872 if (rc) {
1873 kfree(cxlsd);
1874 return ERR_PTR(rc);
1875 }
1876
1877 cxld = &cxlsd->cxld;
1878 cxld->dev.type = &cxl_decoder_switch_type;
1879 return cxlsd;
1880 }
1881 EXPORT_SYMBOL_NS_GPL(cxl_switch_decoder_alloc, "CXL");
1882
1883 /**
1884 * cxl_endpoint_decoder_alloc - Allocate an endpoint decoder
1885 * @port: owning port of this decoder
1886 *
1887 * Return: A new cxl decoder to be registered by cxl_decoder_add()
1888 */
cxl_endpoint_decoder_alloc(struct cxl_port * port)1889 struct cxl_endpoint_decoder *cxl_endpoint_decoder_alloc(struct cxl_port *port)
1890 {
1891 struct cxl_endpoint_decoder *cxled;
1892 struct cxl_decoder *cxld;
1893 int rc;
1894
1895 if (!is_cxl_endpoint(port))
1896 return ERR_PTR(-EINVAL);
1897
1898 cxled = kzalloc(sizeof(*cxled), GFP_KERNEL);
1899 if (!cxled)
1900 return ERR_PTR(-ENOMEM);
1901
1902 cxled->pos = -1;
1903 cxled->part = -1;
1904 cxld = &cxled->cxld;
1905 rc = cxl_decoder_init(port, cxld);
1906 if (rc) {
1907 kfree(cxled);
1908 return ERR_PTR(rc);
1909 }
1910
1911 cxld->dev.type = &cxl_decoder_endpoint_type;
1912 return cxled;
1913 }
1914 EXPORT_SYMBOL_NS_GPL(cxl_endpoint_decoder_alloc, "CXL");
1915
1916 /**
1917 * cxl_decoder_add_locked - Add a decoder with targets
1918 * @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
1919 * @target_map: A list of downstream ports that this decoder can direct memory
1920 * traffic to. These numbers should correspond with the port number
1921 * in the PCIe Link Capabilities structure.
1922 *
1923 * Certain types of decoders may not have any targets. The main example of this
1924 * is an endpoint device. A more awkward example is a hostbridge whose root
1925 * ports get hot added (technically possible, though unlikely).
1926 *
1927 * This is the locked variant of cxl_decoder_add().
1928 *
1929 * Context: Process context. Expects the device lock of the port that owns the
1930 * @cxld to be held.
1931 *
1932 * Return: Negative error code if the decoder wasn't properly configured; else
1933 * returns 0.
1934 */
cxl_decoder_add_locked(struct cxl_decoder * cxld,int * target_map)1935 int cxl_decoder_add_locked(struct cxl_decoder *cxld, int *target_map)
1936 {
1937 struct cxl_port *port;
1938 struct device *dev;
1939 int rc;
1940
1941 if (WARN_ON_ONCE(!cxld))
1942 return -EINVAL;
1943
1944 if (WARN_ON_ONCE(IS_ERR(cxld)))
1945 return PTR_ERR(cxld);
1946
1947 if (cxld->interleave_ways < 1)
1948 return -EINVAL;
1949
1950 dev = &cxld->dev;
1951
1952 port = to_cxl_port(cxld->dev.parent);
1953 if (!is_endpoint_decoder(dev)) {
1954 struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
1955
1956 rc = decoder_populate_targets(cxlsd, port, target_map);
1957 if (rc && (cxld->flags & CXL_DECODER_F_ENABLE)) {
1958 dev_err(&port->dev,
1959 "Failed to populate active decoder targets\n");
1960 return rc;
1961 }
1962 }
1963
1964 rc = dev_set_name(dev, "decoder%d.%d", port->id, cxld->id);
1965 if (rc)
1966 return rc;
1967
1968 return device_add(dev);
1969 }
1970 EXPORT_SYMBOL_NS_GPL(cxl_decoder_add_locked, "CXL");
1971
1972 /**
1973 * cxl_decoder_add - Add a decoder with targets
1974 * @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
1975 * @target_map: A list of downstream ports that this decoder can direct memory
1976 * traffic to. These numbers should correspond with the port number
1977 * in the PCIe Link Capabilities structure.
1978 *
1979 * This is the unlocked variant of cxl_decoder_add_locked().
1980 * See cxl_decoder_add_locked().
1981 *
1982 * Context: Process context. Takes and releases the device lock of the port that
1983 * owns the @cxld.
1984 */
cxl_decoder_add(struct cxl_decoder * cxld,int * target_map)1985 int cxl_decoder_add(struct cxl_decoder *cxld, int *target_map)
1986 {
1987 struct cxl_port *port;
1988
1989 if (WARN_ON_ONCE(!cxld))
1990 return -EINVAL;
1991
1992 if (WARN_ON_ONCE(IS_ERR(cxld)))
1993 return PTR_ERR(cxld);
1994
1995 port = to_cxl_port(cxld->dev.parent);
1996
1997 guard(device)(&port->dev);
1998 return cxl_decoder_add_locked(cxld, target_map);
1999 }
2000 EXPORT_SYMBOL_NS_GPL(cxl_decoder_add, "CXL");
2001
cxld_unregister(void * dev)2002 static void cxld_unregister(void *dev)
2003 {
2004 struct cxl_endpoint_decoder *cxled;
2005
2006 if (is_endpoint_decoder(dev)) {
2007 cxled = to_cxl_endpoint_decoder(dev);
2008 cxl_decoder_kill_region(cxled);
2009 }
2010
2011 device_unregister(dev);
2012 }
2013
cxl_decoder_autoremove(struct device * host,struct cxl_decoder * cxld)2014 int cxl_decoder_autoremove(struct device *host, struct cxl_decoder *cxld)
2015 {
2016 return devm_add_action_or_reset(host, cxld_unregister, &cxld->dev);
2017 }
2018 EXPORT_SYMBOL_NS_GPL(cxl_decoder_autoremove, "CXL");
2019
2020 /**
2021 * __cxl_driver_register - register a driver for the cxl bus
2022 * @cxl_drv: cxl driver structure to attach
2023 * @owner: owning module/driver
2024 * @modname: KBUILD_MODNAME for parent driver
2025 */
__cxl_driver_register(struct cxl_driver * cxl_drv,struct module * owner,const char * modname)2026 int __cxl_driver_register(struct cxl_driver *cxl_drv, struct module *owner,
2027 const char *modname)
2028 {
2029 if (!cxl_drv->probe) {
2030 pr_debug("%s ->probe() must be specified\n", modname);
2031 return -EINVAL;
2032 }
2033
2034 if (!cxl_drv->name) {
2035 pr_debug("%s ->name must be specified\n", modname);
2036 return -EINVAL;
2037 }
2038
2039 if (!cxl_drv->id) {
2040 pr_debug("%s ->id must be specified\n", modname);
2041 return -EINVAL;
2042 }
2043
2044 cxl_drv->drv.bus = &cxl_bus_type;
2045 cxl_drv->drv.owner = owner;
2046 cxl_drv->drv.mod_name = modname;
2047 cxl_drv->drv.name = cxl_drv->name;
2048
2049 return driver_register(&cxl_drv->drv);
2050 }
2051 EXPORT_SYMBOL_NS_GPL(__cxl_driver_register, "CXL");
2052
cxl_driver_unregister(struct cxl_driver * cxl_drv)2053 void cxl_driver_unregister(struct cxl_driver *cxl_drv)
2054 {
2055 driver_unregister(&cxl_drv->drv);
2056 }
2057 EXPORT_SYMBOL_NS_GPL(cxl_driver_unregister, "CXL");
2058
cxl_bus_uevent(const struct device * dev,struct kobj_uevent_env * env)2059 static int cxl_bus_uevent(const struct device *dev, struct kobj_uevent_env *env)
2060 {
2061 return add_uevent_var(env, "MODALIAS=" CXL_MODALIAS_FMT,
2062 cxl_device_id(dev));
2063 }
2064
cxl_bus_match(struct device * dev,const struct device_driver * drv)2065 static int cxl_bus_match(struct device *dev, const struct device_driver *drv)
2066 {
2067 return cxl_device_id(dev) == to_cxl_drv(drv)->id;
2068 }
2069
cxl_bus_probe(struct device * dev)2070 static int cxl_bus_probe(struct device *dev)
2071 {
2072 int rc;
2073
2074 rc = to_cxl_drv(dev->driver)->probe(dev);
2075 dev_dbg(dev, "probe: %d\n", rc);
2076 return rc;
2077 }
2078
cxl_bus_remove(struct device * dev)2079 static void cxl_bus_remove(struct device *dev)
2080 {
2081 struct cxl_driver *cxl_drv = to_cxl_drv(dev->driver);
2082
2083 if (cxl_drv->remove)
2084 cxl_drv->remove(dev);
2085 }
2086
2087 static struct workqueue_struct *cxl_bus_wq;
2088
cxl_rescan_attach(struct device * dev,void * data)2089 static int cxl_rescan_attach(struct device *dev, void *data)
2090 {
2091 int rc = device_attach(dev);
2092
2093 dev_vdbg(dev, "rescan: %s\n", rc ? "attach" : "detached");
2094
2095 return 0;
2096 }
2097
cxl_bus_rescan_queue(struct work_struct * w)2098 static void cxl_bus_rescan_queue(struct work_struct *w)
2099 {
2100 bus_for_each_dev(&cxl_bus_type, NULL, NULL, cxl_rescan_attach);
2101 }
2102
cxl_bus_rescan(void)2103 void cxl_bus_rescan(void)
2104 {
2105 static DECLARE_WORK(rescan_work, cxl_bus_rescan_queue);
2106
2107 queue_work(cxl_bus_wq, &rescan_work);
2108 }
2109 EXPORT_SYMBOL_NS_GPL(cxl_bus_rescan, "CXL");
2110
cxl_bus_drain(void)2111 void cxl_bus_drain(void)
2112 {
2113 drain_workqueue(cxl_bus_wq);
2114 }
2115 EXPORT_SYMBOL_NS_GPL(cxl_bus_drain, "CXL");
2116
schedule_cxl_memdev_detach(struct cxl_memdev * cxlmd)2117 bool schedule_cxl_memdev_detach(struct cxl_memdev *cxlmd)
2118 {
2119 return queue_work(cxl_bus_wq, &cxlmd->detach_work);
2120 }
2121 EXPORT_SYMBOL_NS_GPL(schedule_cxl_memdev_detach, "CXL");
2122
add_latency(struct access_coordinate * c,long latency)2123 static void add_latency(struct access_coordinate *c, long latency)
2124 {
2125 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2126 c[i].write_latency += latency;
2127 c[i].read_latency += latency;
2128 }
2129 }
2130
coordinates_valid(struct access_coordinate * c)2131 static bool coordinates_valid(struct access_coordinate *c)
2132 {
2133 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2134 if (c[i].read_bandwidth && c[i].write_bandwidth &&
2135 c[i].read_latency && c[i].write_latency)
2136 continue;
2137 return false;
2138 }
2139
2140 return true;
2141 }
2142
set_min_bandwidth(struct access_coordinate * c,unsigned int bw)2143 static void set_min_bandwidth(struct access_coordinate *c, unsigned int bw)
2144 {
2145 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2146 c[i].write_bandwidth = min(c[i].write_bandwidth, bw);
2147 c[i].read_bandwidth = min(c[i].read_bandwidth, bw);
2148 }
2149 }
2150
set_access_coordinates(struct access_coordinate * out,struct access_coordinate * in)2151 static void set_access_coordinates(struct access_coordinate *out,
2152 struct access_coordinate *in)
2153 {
2154 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++)
2155 out[i] = in[i];
2156 }
2157
parent_port_is_cxl_root(struct cxl_port * port)2158 static bool parent_port_is_cxl_root(struct cxl_port *port)
2159 {
2160 return is_cxl_root(to_cxl_port(port->dev.parent));
2161 }
2162
2163 /**
2164 * cxl_endpoint_get_perf_coordinates - Retrieve performance numbers stored in dports
2165 * of CXL path
2166 * @port: endpoint cxl_port
2167 * @coord: output performance data
2168 *
2169 * Return: errno on failure, 0 on success.
2170 */
cxl_endpoint_get_perf_coordinates(struct cxl_port * port,struct access_coordinate * coord)2171 int cxl_endpoint_get_perf_coordinates(struct cxl_port *port,
2172 struct access_coordinate *coord)
2173 {
2174 struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
2175 struct access_coordinate c[] = {
2176 {
2177 .read_bandwidth = UINT_MAX,
2178 .write_bandwidth = UINT_MAX,
2179 },
2180 {
2181 .read_bandwidth = UINT_MAX,
2182 .write_bandwidth = UINT_MAX,
2183 },
2184 };
2185 struct cxl_port *iter = port;
2186 struct cxl_dport *dport;
2187 struct pci_dev *pdev;
2188 struct device *dev;
2189 unsigned int bw;
2190 bool is_cxl_root;
2191
2192 if (!is_cxl_endpoint(port))
2193 return -EINVAL;
2194
2195 /*
2196 * Skip calculation for RCD. Expectation is HMAT already covers RCD case
2197 * since RCH does not support hotplug.
2198 */
2199 if (cxlmd->cxlds->rcd)
2200 return 0;
2201
2202 /*
2203 * Exit the loop when the parent port of the current iter port is cxl
2204 * root. The iterative loop starts at the endpoint and gathers the
2205 * latency of the CXL link from the current device/port to the connected
2206 * downstream port each iteration.
2207 */
2208 do {
2209 dport = iter->parent_dport;
2210 iter = to_cxl_port(iter->dev.parent);
2211 is_cxl_root = parent_port_is_cxl_root(iter);
2212
2213 /*
2214 * There's no valid access_coordinate for a root port since RPs do not
2215 * have CDAT and therefore needs to be skipped.
2216 */
2217 if (!is_cxl_root) {
2218 if (!coordinates_valid(dport->coord))
2219 return -EINVAL;
2220 cxl_coordinates_combine(c, c, dport->coord);
2221 }
2222 add_latency(c, dport->link_latency);
2223 } while (!is_cxl_root);
2224
2225 dport = iter->parent_dport;
2226 /* Retrieve HB coords */
2227 if (!coordinates_valid(dport->coord))
2228 return -EINVAL;
2229 cxl_coordinates_combine(c, c, dport->coord);
2230
2231 dev = port->uport_dev->parent;
2232 if (!dev_is_pci(dev))
2233 return -ENODEV;
2234
2235 /* Get the calculated PCI paths bandwidth */
2236 pdev = to_pci_dev(dev);
2237 bw = pcie_bandwidth_available(pdev, NULL, NULL, NULL);
2238 if (bw == 0)
2239 return -ENXIO;
2240 bw /= BITS_PER_BYTE;
2241
2242 set_min_bandwidth(c, bw);
2243 set_access_coordinates(coord, c);
2244
2245 return 0;
2246 }
2247 EXPORT_SYMBOL_NS_GPL(cxl_endpoint_get_perf_coordinates, "CXL");
2248
cxl_port_get_switch_dport_bandwidth(struct cxl_port * port,struct access_coordinate * c)2249 int cxl_port_get_switch_dport_bandwidth(struct cxl_port *port,
2250 struct access_coordinate *c)
2251 {
2252 struct cxl_dport *dport = port->parent_dport;
2253
2254 /* Check this port is connected to a switch DSP and not an RP */
2255 if (parent_port_is_cxl_root(to_cxl_port(port->dev.parent)))
2256 return -ENODEV;
2257
2258 if (!coordinates_valid(dport->coord))
2259 return -EINVAL;
2260
2261 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2262 c[i].read_bandwidth = dport->coord[i].read_bandwidth;
2263 c[i].write_bandwidth = dport->coord[i].write_bandwidth;
2264 }
2265
2266 return 0;
2267 }
2268
2269 /* for user tooling to ensure port disable work has completed */
flush_store(const struct bus_type * bus,const char * buf,size_t count)2270 static ssize_t flush_store(const struct bus_type *bus, const char *buf, size_t count)
2271 {
2272 if (sysfs_streq(buf, "1")) {
2273 flush_workqueue(cxl_bus_wq);
2274 return count;
2275 }
2276
2277 return -EINVAL;
2278 }
2279
2280 static BUS_ATTR_WO(flush);
2281
2282 static struct attribute *cxl_bus_attributes[] = {
2283 &bus_attr_flush.attr,
2284 NULL,
2285 };
2286
2287 static struct attribute_group cxl_bus_attribute_group = {
2288 .attrs = cxl_bus_attributes,
2289 };
2290
2291 static const struct attribute_group *cxl_bus_attribute_groups[] = {
2292 &cxl_bus_attribute_group,
2293 NULL,
2294 };
2295
2296 struct bus_type cxl_bus_type = {
2297 .name = "cxl",
2298 .uevent = cxl_bus_uevent,
2299 .match = cxl_bus_match,
2300 .probe = cxl_bus_probe,
2301 .remove = cxl_bus_remove,
2302 .bus_groups = cxl_bus_attribute_groups,
2303 };
2304 EXPORT_SYMBOL_NS_GPL(cxl_bus_type, "CXL");
2305
2306 static struct dentry *cxl_debugfs;
2307
cxl_debugfs_create_dir(const char * dir)2308 struct dentry *cxl_debugfs_create_dir(const char *dir)
2309 {
2310 return debugfs_create_dir(dir, cxl_debugfs);
2311 }
2312 EXPORT_SYMBOL_NS_GPL(cxl_debugfs_create_dir, "CXL");
2313
cxl_core_init(void)2314 static __init int cxl_core_init(void)
2315 {
2316 int rc;
2317
2318 cxl_debugfs = debugfs_create_dir("cxl", NULL);
2319
2320 if (einj_cxl_is_initialized())
2321 debugfs_create_file("einj_types", 0400, cxl_debugfs, NULL,
2322 &einj_cxl_available_error_type_fops);
2323
2324 cxl_mbox_init();
2325
2326 rc = cxl_memdev_init();
2327 if (rc)
2328 return rc;
2329
2330 cxl_bus_wq = alloc_ordered_workqueue("cxl_port", 0);
2331 if (!cxl_bus_wq) {
2332 rc = -ENOMEM;
2333 goto err_wq;
2334 }
2335
2336 rc = bus_register(&cxl_bus_type);
2337 if (rc)
2338 goto err_bus;
2339
2340 rc = cxl_region_init();
2341 if (rc)
2342 goto err_region;
2343
2344 rc = cxl_ras_init();
2345 if (rc)
2346 goto err_ras;
2347
2348 return 0;
2349
2350 err_ras:
2351 cxl_region_exit();
2352 err_region:
2353 bus_unregister(&cxl_bus_type);
2354 err_bus:
2355 destroy_workqueue(cxl_bus_wq);
2356 err_wq:
2357 cxl_memdev_exit();
2358 return rc;
2359 }
2360
cxl_core_exit(void)2361 static void cxl_core_exit(void)
2362 {
2363 cxl_ras_exit();
2364 cxl_region_exit();
2365 bus_unregister(&cxl_bus_type);
2366 destroy_workqueue(cxl_bus_wq);
2367 cxl_memdev_exit();
2368 debugfs_remove_recursive(cxl_debugfs);
2369 }
2370
2371 subsys_initcall(cxl_core_init);
2372 module_exit(cxl_core_exit);
2373 MODULE_DESCRIPTION("CXL: Core Compute Express Link support");
2374 MODULE_LICENSE("GPL v2");
2375 MODULE_IMPORT_NS("CXL");
2376