xref: /linux/drivers/cxl/core/port.c (revision e812928be2ee1c2744adf20ed04e0ce1e2fc5c13)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /* Copyright(c) 2020 Intel Corporation. All rights reserved. */
3 #include <linux/platform_device.h>
4 #include <linux/memregion.h>
5 #include <linux/workqueue.h>
6 #include <linux/debugfs.h>
7 #include <linux/device.h>
8 #include <linux/module.h>
9 #include <linux/pci.h>
10 #include <linux/slab.h>
11 #include <linux/idr.h>
12 #include <linux/node.h>
13 #include <cxl/einj.h>
14 #include <cxlmem.h>
15 #include <cxlpci.h>
16 #include <cxl.h>
17 #include "core.h"
18 
19 /**
20  * DOC: cxl core
21  *
22  * The CXL core provides a set of interfaces that can be consumed by CXL aware
23  * drivers. The interfaces allow for creation, modification, and destruction of
24  * regions, memory devices, ports, and decoders. CXL aware drivers must register
25  * with the CXL core via these interfaces in order to be able to participate in
26  * cross-device interleave coordination. The CXL core also establishes and
27  * maintains the bridge to the nvdimm subsystem.
28  *
29  * CXL core introduces sysfs hierarchy to control the devices that are
30  * instantiated by the core.
31  */
32 
33 static DEFINE_IDA(cxl_port_ida);
34 static DEFINE_XARRAY(cxl_root_buses);
35 
36 /*
37  * The terminal device in PCI is NULL and @platform_bus
38  * for platform devices (for cxl_test)
39  */
40 static bool is_cxl_host_bridge(struct device *dev)
41 {
42 	return (!dev || dev == &platform_bus);
43 }
44 
45 int cxl_num_decoders_committed(struct cxl_port *port)
46 {
47 	lockdep_assert_held(&cxl_rwsem.region);
48 
49 	return port->commit_end + 1;
50 }
51 
52 static ssize_t devtype_show(struct device *dev, struct device_attribute *attr,
53 			    char *buf)
54 {
55 	return sysfs_emit(buf, "%s\n", dev->type->name);
56 }
57 static DEVICE_ATTR_RO(devtype);
58 
59 static int cxl_device_id(const struct device *dev)
60 {
61 	if (dev->type == &cxl_nvdimm_bridge_type)
62 		return CXL_DEVICE_NVDIMM_BRIDGE;
63 	if (dev->type == &cxl_nvdimm_type)
64 		return CXL_DEVICE_NVDIMM;
65 	if (dev->type == CXL_PMEM_REGION_TYPE())
66 		return CXL_DEVICE_PMEM_REGION;
67 	if (dev->type == CXL_DAX_REGION_TYPE())
68 		return CXL_DEVICE_DAX_REGION;
69 	if (is_cxl_port(dev)) {
70 		if (is_cxl_root(to_cxl_port(dev)))
71 			return CXL_DEVICE_ROOT;
72 		return CXL_DEVICE_PORT;
73 	}
74 	if (is_cxl_memdev(dev))
75 		return CXL_DEVICE_MEMORY_EXPANDER;
76 	if (dev->type == CXL_REGION_TYPE())
77 		return CXL_DEVICE_REGION;
78 	if (dev->type == &cxl_pmu_type)
79 		return CXL_DEVICE_PMU;
80 	return 0;
81 }
82 
83 static ssize_t modalias_show(struct device *dev, struct device_attribute *attr,
84 			     char *buf)
85 {
86 	return sysfs_emit(buf, CXL_MODALIAS_FMT "\n", cxl_device_id(dev));
87 }
88 static DEVICE_ATTR_RO(modalias);
89 
90 static struct attribute *cxl_base_attributes[] = {
91 	&dev_attr_devtype.attr,
92 	&dev_attr_modalias.attr,
93 	NULL,
94 };
95 
96 struct attribute_group cxl_base_attribute_group = {
97 	.attrs = cxl_base_attributes,
98 };
99 
100 static ssize_t start_show(struct device *dev, struct device_attribute *attr,
101 			  char *buf)
102 {
103 	struct cxl_decoder *cxld = to_cxl_decoder(dev);
104 
105 	return sysfs_emit(buf, "%#llx\n", cxld->hpa_range.start);
106 }
107 static DEVICE_ATTR_ADMIN_RO(start);
108 
109 static ssize_t size_show(struct device *dev, struct device_attribute *attr,
110 			char *buf)
111 {
112 	struct cxl_decoder *cxld = to_cxl_decoder(dev);
113 
114 	return sysfs_emit(buf, "%#llx\n", range_len(&cxld->hpa_range));
115 }
116 static DEVICE_ATTR_RO(size);
117 
118 #define CXL_DECODER_FLAG_ATTR(name, flag)                            \
119 static ssize_t name##_show(struct device *dev,                       \
120 			   struct device_attribute *attr, char *buf) \
121 {                                                                    \
122 	struct cxl_decoder *cxld = to_cxl_decoder(dev);              \
123                                                                      \
124 	return sysfs_emit(buf, "%s\n",                               \
125 			  (cxld->flags & (flag)) ? "1" : "0");       \
126 }                                                                    \
127 static DEVICE_ATTR_RO(name)
128 
129 CXL_DECODER_FLAG_ATTR(cap_pmem, CXL_DECODER_F_PMEM);
130 CXL_DECODER_FLAG_ATTR(cap_ram, CXL_DECODER_F_RAM);
131 CXL_DECODER_FLAG_ATTR(cap_type2, CXL_DECODER_F_TYPE2);
132 CXL_DECODER_FLAG_ATTR(cap_type3, CXL_DECODER_F_TYPE3);
133 CXL_DECODER_FLAG_ATTR(locked, CXL_DECODER_F_LOCK);
134 
135 static ssize_t target_type_show(struct device *dev,
136 				struct device_attribute *attr, char *buf)
137 {
138 	struct cxl_decoder *cxld = to_cxl_decoder(dev);
139 
140 	switch (cxld->target_type) {
141 	case CXL_DECODER_DEVMEM:
142 		return sysfs_emit(buf, "accelerator\n");
143 	case CXL_DECODER_HOSTONLYMEM:
144 		return sysfs_emit(buf, "expander\n");
145 	}
146 	return -ENXIO;
147 }
148 static DEVICE_ATTR_RO(target_type);
149 
150 static ssize_t emit_target_list(struct cxl_switch_decoder *cxlsd, char *buf)
151 {
152 	struct cxl_decoder *cxld = &cxlsd->cxld;
153 	ssize_t offset = 0;
154 	int i, rc = 0;
155 
156 	for (i = 0; i < cxld->interleave_ways; i++) {
157 		struct cxl_dport *dport = cxlsd->target[i];
158 		struct cxl_dport *next = NULL;
159 
160 		if (!dport)
161 			break;
162 
163 		if (i + 1 < cxld->interleave_ways)
164 			next = cxlsd->target[i + 1];
165 		rc = sysfs_emit_at(buf, offset, "%d%s", dport->port_id,
166 				   next ? "," : "");
167 		if (rc < 0)
168 			return rc;
169 		offset += rc;
170 	}
171 
172 	return offset;
173 }
174 
175 static ssize_t target_list_show(struct device *dev,
176 				struct device_attribute *attr, char *buf)
177 {
178 	struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
179 	ssize_t offset;
180 	int rc;
181 
182 	guard(rwsem_read)(&cxl_rwsem.region);
183 	rc = emit_target_list(cxlsd, buf);
184 	if (rc < 0)
185 		return rc;
186 	offset = rc;
187 
188 	rc = sysfs_emit_at(buf, offset, "\n");
189 	if (rc < 0)
190 		return rc;
191 
192 	return offset + rc;
193 }
194 static DEVICE_ATTR_RO(target_list);
195 
196 static ssize_t mode_show(struct device *dev, struct device_attribute *attr,
197 			 char *buf)
198 {
199 	struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
200 	struct cxl_memdev *cxlmd = cxled_to_memdev(cxled);
201 	struct cxl_dev_state *cxlds = cxlmd->cxlds;
202 	/* without @cxl_rwsem.dpa, make sure @part is not reloaded */
203 	int part = READ_ONCE(cxled->part);
204 	const char *desc;
205 
206 	if (part < 0)
207 		desc = "none";
208 	else
209 		desc = cxlds->part[part].res.name;
210 
211 	return sysfs_emit(buf, "%s\n", desc);
212 }
213 
214 static ssize_t mode_store(struct device *dev, struct device_attribute *attr,
215 			  const char *buf, size_t len)
216 {
217 	struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
218 	enum cxl_partition_mode mode;
219 	ssize_t rc;
220 
221 	if (sysfs_streq(buf, "pmem"))
222 		mode = CXL_PARTMODE_PMEM;
223 	else if (sysfs_streq(buf, "ram"))
224 		mode = CXL_PARTMODE_RAM;
225 	else
226 		return -EINVAL;
227 
228 	rc = cxl_dpa_set_part(cxled, mode);
229 	if (rc)
230 		return rc;
231 
232 	return len;
233 }
234 static DEVICE_ATTR_RW(mode);
235 
236 static ssize_t dpa_resource_show(struct device *dev, struct device_attribute *attr,
237 			    char *buf)
238 {
239 	struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
240 
241 	guard(rwsem_read)(&cxl_rwsem.dpa);
242 	return sysfs_emit(buf, "%#llx\n", (u64)cxl_dpa_resource_start(cxled));
243 }
244 static DEVICE_ATTR_RO(dpa_resource);
245 
246 static ssize_t dpa_size_show(struct device *dev, struct device_attribute *attr,
247 			     char *buf)
248 {
249 	struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
250 	resource_size_t size = cxl_dpa_size(cxled);
251 
252 	return sysfs_emit(buf, "%pa\n", &size);
253 }
254 
255 static ssize_t dpa_size_store(struct device *dev, struct device_attribute *attr,
256 			      const char *buf, size_t len)
257 {
258 	struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
259 	unsigned long long size;
260 	ssize_t rc;
261 
262 	rc = kstrtoull(buf, 0, &size);
263 	if (rc)
264 		return rc;
265 
266 	if (!IS_ALIGNED(size, SZ_256M))
267 		return -EINVAL;
268 
269 	rc = cxl_dpa_free(cxled);
270 	if (rc)
271 		return rc;
272 
273 	if (size == 0)
274 		return len;
275 
276 	rc = cxl_dpa_alloc(cxled, size);
277 	if (rc)
278 		return rc;
279 
280 	return len;
281 }
282 static DEVICE_ATTR_RW(dpa_size);
283 
284 static ssize_t interleave_granularity_show(struct device *dev,
285 					   struct device_attribute *attr,
286 					   char *buf)
287 {
288 	struct cxl_decoder *cxld = to_cxl_decoder(dev);
289 
290 	return sysfs_emit(buf, "%d\n", cxld->interleave_granularity);
291 }
292 
293 static DEVICE_ATTR_RO(interleave_granularity);
294 
295 static ssize_t interleave_ways_show(struct device *dev,
296 				    struct device_attribute *attr, char *buf)
297 {
298 	struct cxl_decoder *cxld = to_cxl_decoder(dev);
299 
300 	return sysfs_emit(buf, "%d\n", cxld->interleave_ways);
301 }
302 
303 static DEVICE_ATTR_RO(interleave_ways);
304 
305 static ssize_t qos_class_show(struct device *dev,
306 			      struct device_attribute *attr, char *buf)
307 {
308 	struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
309 
310 	return sysfs_emit(buf, "%d\n", cxlrd->qos_class);
311 }
312 static DEVICE_ATTR_RO(qos_class);
313 
314 static struct attribute *cxl_decoder_base_attrs[] = {
315 	&dev_attr_start.attr,
316 	&dev_attr_size.attr,
317 	&dev_attr_locked.attr,
318 	&dev_attr_interleave_granularity.attr,
319 	&dev_attr_interleave_ways.attr,
320 	NULL,
321 };
322 
323 static struct attribute_group cxl_decoder_base_attribute_group = {
324 	.attrs = cxl_decoder_base_attrs,
325 };
326 
327 static struct attribute *cxl_decoder_root_attrs[] = {
328 	&dev_attr_cap_pmem.attr,
329 	&dev_attr_cap_ram.attr,
330 	&dev_attr_cap_type2.attr,
331 	&dev_attr_cap_type3.attr,
332 	&dev_attr_target_list.attr,
333 	&dev_attr_qos_class.attr,
334 	SET_CXL_REGION_ATTR(create_pmem_region)
335 	SET_CXL_REGION_ATTR(create_ram_region)
336 	SET_CXL_REGION_ATTR(delete_region)
337 	NULL,
338 };
339 
340 static bool can_create_pmem(struct cxl_root_decoder *cxlrd)
341 {
342 	unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_PMEM;
343 
344 	return (cxlrd->cxlsd.cxld.flags & flags) == flags;
345 }
346 
347 static bool can_create_ram(struct cxl_root_decoder *cxlrd)
348 {
349 	unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_RAM;
350 
351 	return (cxlrd->cxlsd.cxld.flags & flags) == flags;
352 }
353 
354 static umode_t cxl_root_decoder_visible(struct kobject *kobj, struct attribute *a, int n)
355 {
356 	struct device *dev = kobj_to_dev(kobj);
357 	struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
358 
359 	if (a == CXL_REGION_ATTR(create_pmem_region) && !can_create_pmem(cxlrd))
360 		return 0;
361 
362 	if (a == CXL_REGION_ATTR(create_ram_region) && !can_create_ram(cxlrd))
363 		return 0;
364 
365 	if (a == CXL_REGION_ATTR(delete_region) &&
366 	    !(can_create_pmem(cxlrd) || can_create_ram(cxlrd)))
367 		return 0;
368 
369 	return a->mode;
370 }
371 
372 static struct attribute_group cxl_decoder_root_attribute_group = {
373 	.attrs = cxl_decoder_root_attrs,
374 	.is_visible = cxl_root_decoder_visible,
375 };
376 
377 static const struct attribute_group *cxl_decoder_root_attribute_groups[] = {
378 	&cxl_decoder_root_attribute_group,
379 	&cxl_decoder_base_attribute_group,
380 	&cxl_base_attribute_group,
381 	NULL,
382 };
383 
384 static struct attribute *cxl_decoder_switch_attrs[] = {
385 	&dev_attr_target_type.attr,
386 	&dev_attr_target_list.attr,
387 	SET_CXL_REGION_ATTR(region)
388 	NULL,
389 };
390 
391 static struct attribute_group cxl_decoder_switch_attribute_group = {
392 	.attrs = cxl_decoder_switch_attrs,
393 };
394 
395 static const struct attribute_group *cxl_decoder_switch_attribute_groups[] = {
396 	&cxl_decoder_switch_attribute_group,
397 	&cxl_decoder_base_attribute_group,
398 	&cxl_base_attribute_group,
399 	NULL,
400 };
401 
402 static struct attribute *cxl_decoder_endpoint_attrs[] = {
403 	&dev_attr_target_type.attr,
404 	&dev_attr_mode.attr,
405 	&dev_attr_dpa_size.attr,
406 	&dev_attr_dpa_resource.attr,
407 	SET_CXL_REGION_ATTR(region)
408 	NULL,
409 };
410 
411 static struct attribute_group cxl_decoder_endpoint_attribute_group = {
412 	.attrs = cxl_decoder_endpoint_attrs,
413 };
414 
415 static const struct attribute_group *cxl_decoder_endpoint_attribute_groups[] = {
416 	&cxl_decoder_base_attribute_group,
417 	&cxl_decoder_endpoint_attribute_group,
418 	&cxl_base_attribute_group,
419 	NULL,
420 };
421 
422 static void __cxl_decoder_release(struct cxl_decoder *cxld)
423 {
424 	struct cxl_port *port = to_cxl_port(cxld->dev.parent);
425 
426 	ida_free(&port->decoder_ida, cxld->id);
427 	put_device(&port->dev);
428 }
429 
430 static void cxl_endpoint_decoder_release(struct device *dev)
431 {
432 	struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
433 
434 	__cxl_decoder_release(&cxled->cxld);
435 	kfree(cxled);
436 }
437 
438 static void cxl_switch_decoder_release(struct device *dev)
439 {
440 	struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
441 
442 	__cxl_decoder_release(&cxlsd->cxld);
443 	kfree(cxlsd);
444 }
445 
446 struct cxl_root_decoder *to_cxl_root_decoder(struct device *dev)
447 {
448 	if (dev_WARN_ONCE(dev, !is_root_decoder(dev),
449 			  "not a cxl_root_decoder device\n"))
450 		return NULL;
451 	return container_of(dev, struct cxl_root_decoder, cxlsd.cxld.dev);
452 }
453 EXPORT_SYMBOL_NS_GPL(to_cxl_root_decoder, "CXL");
454 
455 static void cxl_root_decoder_release(struct device *dev)
456 {
457 	struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
458 
459 	if (atomic_read(&cxlrd->region_id) >= 0)
460 		memregion_free(atomic_read(&cxlrd->region_id));
461 	__cxl_decoder_release(&cxlrd->cxlsd.cxld);
462 	kfree(cxlrd);
463 }
464 
465 static const struct device_type cxl_decoder_endpoint_type = {
466 	.name = "cxl_decoder_endpoint",
467 	.release = cxl_endpoint_decoder_release,
468 	.groups = cxl_decoder_endpoint_attribute_groups,
469 };
470 
471 static const struct device_type cxl_decoder_switch_type = {
472 	.name = "cxl_decoder_switch",
473 	.release = cxl_switch_decoder_release,
474 	.groups = cxl_decoder_switch_attribute_groups,
475 };
476 
477 static const struct device_type cxl_decoder_root_type = {
478 	.name = "cxl_decoder_root",
479 	.release = cxl_root_decoder_release,
480 	.groups = cxl_decoder_root_attribute_groups,
481 };
482 
483 bool is_endpoint_decoder(struct device *dev)
484 {
485 	return dev->type == &cxl_decoder_endpoint_type;
486 }
487 EXPORT_SYMBOL_NS_GPL(is_endpoint_decoder, "CXL");
488 
489 bool is_root_decoder(struct device *dev)
490 {
491 	return dev->type == &cxl_decoder_root_type;
492 }
493 EXPORT_SYMBOL_NS_GPL(is_root_decoder, "CXL");
494 
495 bool is_switch_decoder(struct device *dev)
496 {
497 	return is_root_decoder(dev) || dev->type == &cxl_decoder_switch_type;
498 }
499 EXPORT_SYMBOL_NS_GPL(is_switch_decoder, "CXL");
500 
501 struct cxl_decoder *to_cxl_decoder(struct device *dev)
502 {
503 	if (dev_WARN_ONCE(dev,
504 			  !is_switch_decoder(dev) && !is_endpoint_decoder(dev),
505 			  "not a cxl_decoder device\n"))
506 		return NULL;
507 	return container_of(dev, struct cxl_decoder, dev);
508 }
509 EXPORT_SYMBOL_NS_GPL(to_cxl_decoder, "CXL");
510 
511 struct cxl_endpoint_decoder *to_cxl_endpoint_decoder(struct device *dev)
512 {
513 	if (dev_WARN_ONCE(dev, !is_endpoint_decoder(dev),
514 			  "not a cxl_endpoint_decoder device\n"))
515 		return NULL;
516 	return container_of(dev, struct cxl_endpoint_decoder, cxld.dev);
517 }
518 EXPORT_SYMBOL_NS_GPL(to_cxl_endpoint_decoder, "CXL");
519 
520 struct cxl_switch_decoder *to_cxl_switch_decoder(struct device *dev)
521 {
522 	if (dev_WARN_ONCE(dev, !is_switch_decoder(dev),
523 			  "not a cxl_switch_decoder device\n"))
524 		return NULL;
525 	return container_of(dev, struct cxl_switch_decoder, cxld.dev);
526 }
527 EXPORT_SYMBOL_NS_GPL(to_cxl_switch_decoder, "CXL");
528 
529 static void cxl_ep_release(struct cxl_ep *ep)
530 {
531 	put_device(ep->ep);
532 	kfree(ep);
533 }
534 
535 static void cxl_ep_remove(struct cxl_port *port, struct cxl_ep *ep)
536 {
537 	if (!ep)
538 		return;
539 	xa_erase(&port->endpoints, (unsigned long) ep->ep);
540 	cxl_ep_release(ep);
541 }
542 
543 static void cxl_port_release(struct device *dev)
544 {
545 	struct cxl_port *port = to_cxl_port(dev);
546 	unsigned long index;
547 	struct cxl_ep *ep;
548 
549 	xa_for_each(&port->endpoints, index, ep)
550 		cxl_ep_remove(port, ep);
551 	xa_destroy(&port->endpoints);
552 	xa_destroy(&port->dports);
553 	xa_destroy(&port->regions);
554 	ida_free(&cxl_port_ida, port->id);
555 	if (is_cxl_root(port))
556 		kfree(to_cxl_root(port));
557 	else
558 		kfree(port);
559 }
560 
561 static ssize_t decoders_committed_show(struct device *dev,
562 				       struct device_attribute *attr, char *buf)
563 {
564 	struct cxl_port *port = to_cxl_port(dev);
565 
566 	guard(rwsem_read)(&cxl_rwsem.region);
567 	return sysfs_emit(buf, "%d\n", cxl_num_decoders_committed(port));
568 }
569 
570 static DEVICE_ATTR_RO(decoders_committed);
571 
572 static struct attribute *cxl_port_attrs[] = {
573 	&dev_attr_decoders_committed.attr,
574 	NULL,
575 };
576 
577 static struct attribute_group cxl_port_attribute_group = {
578 	.attrs = cxl_port_attrs,
579 };
580 
581 static const struct attribute_group *cxl_port_attribute_groups[] = {
582 	&cxl_base_attribute_group,
583 	&cxl_port_attribute_group,
584 	NULL,
585 };
586 
587 static const struct device_type cxl_port_type = {
588 	.name = "cxl_port",
589 	.release = cxl_port_release,
590 	.groups = cxl_port_attribute_groups,
591 };
592 
593 bool is_cxl_port(const struct device *dev)
594 {
595 	return dev->type == &cxl_port_type;
596 }
597 EXPORT_SYMBOL_NS_GPL(is_cxl_port, "CXL");
598 
599 struct cxl_port *to_cxl_port(const struct device *dev)
600 {
601 	if (dev_WARN_ONCE(dev, dev->type != &cxl_port_type,
602 			  "not a cxl_port device\n"))
603 		return NULL;
604 	return container_of(dev, struct cxl_port, dev);
605 }
606 EXPORT_SYMBOL_NS_GPL(to_cxl_port, "CXL");
607 
608 struct cxl_port *parent_port_of(struct cxl_port *port)
609 {
610 	if (!port || !port->parent_dport)
611 		return NULL;
612 	return port->parent_dport->port;
613 }
614 
615 static void unregister_port(void *_port)
616 {
617 	struct cxl_port *port = _port;
618 	struct cxl_port *parent = parent_port_of(port);
619 	struct device *lock_dev;
620 
621 	/*
622 	 * CXL root port's and the first level of ports are unregistered
623 	 * under the platform firmware device lock, all other ports are
624 	 * unregistered while holding their parent port lock.
625 	 */
626 	if (!parent)
627 		lock_dev = port->uport_dev;
628 	else if (is_cxl_root(parent))
629 		lock_dev = parent->uport_dev;
630 	else
631 		lock_dev = &parent->dev;
632 
633 	device_lock_assert(lock_dev);
634 	port->dead = true;
635 	device_unregister(&port->dev);
636 }
637 
638 static void cxl_unlink_uport(void *_port)
639 {
640 	struct cxl_port *port = _port;
641 
642 	sysfs_remove_link(&port->dev.kobj, "uport");
643 }
644 
645 static int devm_cxl_link_uport(struct device *host, struct cxl_port *port)
646 {
647 	int rc;
648 
649 	rc = sysfs_create_link(&port->dev.kobj, &port->uport_dev->kobj,
650 			       "uport");
651 	if (rc)
652 		return rc;
653 	return devm_add_action_or_reset(host, cxl_unlink_uport, port);
654 }
655 
656 static void cxl_unlink_parent_dport(void *_port)
657 {
658 	struct cxl_port *port = _port;
659 
660 	sysfs_remove_link(&port->dev.kobj, "parent_dport");
661 }
662 
663 static int devm_cxl_link_parent_dport(struct device *host,
664 				      struct cxl_port *port,
665 				      struct cxl_dport *parent_dport)
666 {
667 	int rc;
668 
669 	if (!parent_dport)
670 		return 0;
671 
672 	rc = sysfs_create_link(&port->dev.kobj, &parent_dport->dport_dev->kobj,
673 			       "parent_dport");
674 	if (rc)
675 		return rc;
676 	return devm_add_action_or_reset(host, cxl_unlink_parent_dport, port);
677 }
678 
679 static struct lock_class_key cxl_port_key;
680 
681 static struct cxl_port *cxl_port_alloc(struct device *uport_dev,
682 				       struct cxl_dport *parent_dport)
683 {
684 	struct cxl_root *cxl_root __free(kfree) = NULL;
685 	struct cxl_port *port, *_port __free(kfree) = NULL;
686 	struct device *dev;
687 	int rc;
688 
689 	/* No parent_dport, root cxl_port */
690 	if (!parent_dport) {
691 		cxl_root = kzalloc(sizeof(*cxl_root), GFP_KERNEL);
692 		if (!cxl_root)
693 			return ERR_PTR(-ENOMEM);
694 	} else {
695 		_port = kzalloc(sizeof(*port), GFP_KERNEL);
696 		if (!_port)
697 			return ERR_PTR(-ENOMEM);
698 	}
699 
700 	rc = ida_alloc(&cxl_port_ida, GFP_KERNEL);
701 	if (rc < 0)
702 		return ERR_PTR(rc);
703 
704 	if (cxl_root)
705 		port = &no_free_ptr(cxl_root)->port;
706 	else
707 		port = no_free_ptr(_port);
708 
709 	port->id = rc;
710 	port->uport_dev = uport_dev;
711 
712 	/*
713 	 * The top-level cxl_port "cxl_root" does not have a cxl_port as
714 	 * its parent and it does not have any corresponding component
715 	 * registers as its decode is described by a fixed platform
716 	 * description.
717 	 */
718 	dev = &port->dev;
719 	if (parent_dport) {
720 		struct cxl_port *parent_port = parent_dport->port;
721 		struct cxl_port *iter;
722 
723 		dev->parent = &parent_port->dev;
724 		port->depth = parent_port->depth + 1;
725 		port->parent_dport = parent_dport;
726 
727 		/*
728 		 * walk to the host bridge, or the first ancestor that knows
729 		 * the host bridge
730 		 */
731 		iter = port;
732 		while (!iter->host_bridge &&
733 		       !is_cxl_root(to_cxl_port(iter->dev.parent)))
734 			iter = to_cxl_port(iter->dev.parent);
735 		if (iter->host_bridge)
736 			port->host_bridge = iter->host_bridge;
737 		else if (parent_dport->rch)
738 			port->host_bridge = parent_dport->dport_dev;
739 		else
740 			port->host_bridge = iter->uport_dev;
741 		dev_dbg(uport_dev, "host-bridge: %s\n",
742 			dev_name(port->host_bridge));
743 	} else
744 		dev->parent = uport_dev;
745 
746 	ida_init(&port->decoder_ida);
747 	port->hdm_end = -1;
748 	port->commit_end = -1;
749 	xa_init(&port->dports);
750 	xa_init(&port->endpoints);
751 	xa_init(&port->regions);
752 	port->component_reg_phys = CXL_RESOURCE_NONE;
753 
754 	device_initialize(dev);
755 	lockdep_set_class_and_subclass(&dev->mutex, &cxl_port_key, port->depth);
756 	device_set_pm_not_required(dev);
757 	dev->bus = &cxl_bus_type;
758 	dev->type = &cxl_port_type;
759 
760 	return port;
761 }
762 
763 static int cxl_setup_comp_regs(struct device *host, struct cxl_register_map *map,
764 			       resource_size_t component_reg_phys)
765 {
766 	*map = (struct cxl_register_map) {
767 		.host = host,
768 		.reg_type = CXL_REGLOC_RBI_EMPTY,
769 		.resource = component_reg_phys,
770 	};
771 
772 	if (component_reg_phys == CXL_RESOURCE_NONE)
773 		return 0;
774 
775 	map->reg_type = CXL_REGLOC_RBI_COMPONENT;
776 	map->max_size = CXL_COMPONENT_REG_BLOCK_SIZE;
777 
778 	return cxl_setup_regs(map);
779 }
780 
781 int cxl_port_setup_regs(struct cxl_port *port,
782 			resource_size_t component_reg_phys)
783 {
784 	if (dev_is_platform(port->uport_dev))
785 		return 0;
786 	return cxl_setup_comp_regs(&port->dev, &port->reg_map,
787 				   component_reg_phys);
788 }
789 EXPORT_SYMBOL_NS_GPL(cxl_port_setup_regs, "CXL");
790 
791 static int cxl_dport_setup_regs(struct device *host, struct cxl_dport *dport,
792 				resource_size_t component_reg_phys)
793 {
794 	int rc;
795 
796 	if (dev_is_platform(dport->dport_dev))
797 		return 0;
798 
799 	/*
800 	 * use @dport->dport_dev for the context for error messages during
801 	 * register probing, and fixup @host after the fact, since @host may be
802 	 * NULL.
803 	 */
804 	rc = cxl_setup_comp_regs(dport->dport_dev, &dport->reg_map,
805 				 component_reg_phys);
806 	dport->reg_map.host = host;
807 	return rc;
808 }
809 
810 DEFINE_SHOW_ATTRIBUTE(einj_cxl_available_error_type);
811 
812 static int cxl_einj_inject(void *data, u64 type)
813 {
814 	struct cxl_dport *dport = data;
815 
816 	if (dport->rch)
817 		return einj_cxl_inject_rch_error(dport->rcrb.base, type);
818 
819 	return einj_cxl_inject_error(to_pci_dev(dport->dport_dev), type);
820 }
821 DEFINE_DEBUGFS_ATTRIBUTE(cxl_einj_inject_fops, NULL, cxl_einj_inject,
822 			 "0x%llx\n");
823 
824 static void cxl_debugfs_create_dport_dir(struct cxl_dport *dport)
825 {
826 	struct cxl_port *parent = parent_port_of(dport->port);
827 	struct dentry *dir;
828 
829 	if (!einj_cxl_is_initialized())
830 		return;
831 
832 	/*
833 	 * Protocol error injection is only available for CXL 2.0+ root ports
834 	 * and CXL 1.1 downstream ports
835 	 */
836 	if (!dport->rch &&
837 	    !(dev_is_pci(dport->dport_dev) && parent && is_cxl_root(parent)))
838 		return;
839 
840 	dir = cxl_debugfs_create_dir(dev_name(dport->dport_dev));
841 
842 	debugfs_create_file("einj_inject", 0200, dir, dport,
843 			    &cxl_einj_inject_fops);
844 }
845 
846 static int cxl_port_add(struct cxl_port *port,
847 			resource_size_t component_reg_phys,
848 			struct cxl_dport *parent_dport)
849 {
850 	struct device *dev __free(put_device) = &port->dev;
851 	int rc;
852 
853 	if (is_cxl_memdev(port->uport_dev)) {
854 		struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
855 		struct cxl_dev_state *cxlds = cxlmd->cxlds;
856 
857 		rc = dev_set_name(dev, "endpoint%d", port->id);
858 		if (rc)
859 			return rc;
860 
861 		/*
862 		 * The endpoint driver already enumerated the component and RAS
863 		 * registers. Reuse that enumeration while prepping them to be
864 		 * mapped by the cxl_port driver.
865 		 */
866 		port->reg_map = cxlds->reg_map;
867 		port->reg_map.host = &port->dev;
868 		cxlmd->endpoint = port;
869 	} else if (parent_dport) {
870 		rc = dev_set_name(dev, "port%d", port->id);
871 		if (rc)
872 			return rc;
873 
874 		port->component_reg_phys = component_reg_phys;
875 	} else {
876 		rc = dev_set_name(dev, "root%d", port->id);
877 		if (rc)
878 			return rc;
879 	}
880 
881 	rc = device_add(dev);
882 	if (rc)
883 		return rc;
884 
885 	/* Inhibit the cleanup function invoked */
886 	dev = NULL;
887 	return 0;
888 }
889 
890 static struct cxl_port *__devm_cxl_add_port(struct device *host,
891 					    struct device *uport_dev,
892 					    resource_size_t component_reg_phys,
893 					    struct cxl_dport *parent_dport)
894 {
895 	struct cxl_port *port;
896 	int rc;
897 
898 	port = cxl_port_alloc(uport_dev, parent_dport);
899 	if (IS_ERR(port))
900 		return port;
901 
902 	rc = cxl_port_add(port, component_reg_phys, parent_dport);
903 	if (rc)
904 		return ERR_PTR(rc);
905 
906 	rc = devm_add_action_or_reset(host, unregister_port, port);
907 	if (rc)
908 		return ERR_PTR(rc);
909 
910 	rc = devm_cxl_link_uport(host, port);
911 	if (rc)
912 		return ERR_PTR(rc);
913 
914 	rc = devm_cxl_link_parent_dport(host, port, parent_dport);
915 	if (rc)
916 		return ERR_PTR(rc);
917 
918 	if (parent_dport && dev_is_pci(uport_dev))
919 		port->pci_latency = cxl_pci_get_latency(to_pci_dev(uport_dev));
920 
921 	return port;
922 }
923 
924 /**
925  * devm_cxl_add_port - register a cxl_port in CXL memory decode hierarchy
926  * @host: host device for devm operations
927  * @uport_dev: "physical" device implementing this upstream port
928  * @component_reg_phys: (optional) for configurable cxl_port instances
929  * @parent_dport: next hop up in the CXL memory decode hierarchy
930  */
931 struct cxl_port *devm_cxl_add_port(struct device *host,
932 				   struct device *uport_dev,
933 				   resource_size_t component_reg_phys,
934 				   struct cxl_dport *parent_dport)
935 {
936 	struct cxl_port *port, *parent_port;
937 
938 	port = __devm_cxl_add_port(host, uport_dev, component_reg_phys,
939 				   parent_dport);
940 
941 	parent_port = parent_dport ? parent_dport->port : NULL;
942 	if (IS_ERR(port)) {
943 		dev_dbg(uport_dev, "Failed to add%s%s%s: %ld\n",
944 			parent_port ? " port to " : "",
945 			parent_port ? dev_name(&parent_port->dev) : "",
946 			parent_port ? "" : " root port",
947 			PTR_ERR(port));
948 	} else {
949 		dev_dbg(uport_dev, "%s added%s%s%s\n",
950 			dev_name(&port->dev),
951 			parent_port ? " to " : "",
952 			parent_port ? dev_name(&parent_port->dev) : "",
953 			parent_port ? "" : " (root port)");
954 	}
955 
956 	return port;
957 }
958 EXPORT_SYMBOL_NS_GPL(devm_cxl_add_port, "CXL");
959 
960 struct cxl_root *devm_cxl_add_root(struct device *host)
961 {
962 	struct cxl_port *port;
963 
964 	port = devm_cxl_add_port(host, host, CXL_RESOURCE_NONE, NULL);
965 	if (IS_ERR(port))
966 		return ERR_CAST(port);
967 
968 	return to_cxl_root(port);
969 }
970 EXPORT_SYMBOL_NS_GPL(devm_cxl_add_root, "CXL");
971 
972 struct pci_bus *cxl_port_to_pci_bus(struct cxl_port *port)
973 {
974 	/* There is no pci_bus associated with a CXL platform-root port */
975 	if (is_cxl_root(port))
976 		return NULL;
977 
978 	if (dev_is_pci(port->uport_dev)) {
979 		struct pci_dev *pdev = to_pci_dev(port->uport_dev);
980 
981 		return pdev->subordinate;
982 	}
983 
984 	return xa_load(&cxl_root_buses, (unsigned long)port->uport_dev);
985 }
986 EXPORT_SYMBOL_NS_GPL(cxl_port_to_pci_bus, "CXL");
987 
988 static void unregister_pci_bus(void *uport_dev)
989 {
990 	xa_erase(&cxl_root_buses, (unsigned long)uport_dev);
991 }
992 
993 int devm_cxl_register_pci_bus(struct device *host, struct device *uport_dev,
994 			      struct pci_bus *bus)
995 {
996 	int rc;
997 
998 	if (dev_is_pci(uport_dev))
999 		return -EINVAL;
1000 
1001 	rc = xa_insert(&cxl_root_buses, (unsigned long)uport_dev, bus,
1002 		       GFP_KERNEL);
1003 	if (rc)
1004 		return rc;
1005 	return devm_add_action_or_reset(host, unregister_pci_bus, uport_dev);
1006 }
1007 EXPORT_SYMBOL_NS_GPL(devm_cxl_register_pci_bus, "CXL");
1008 
1009 static bool dev_is_cxl_root_child(struct device *dev)
1010 {
1011 	struct cxl_port *port, *parent;
1012 
1013 	if (!is_cxl_port(dev))
1014 		return false;
1015 
1016 	port = to_cxl_port(dev);
1017 	if (is_cxl_root(port))
1018 		return false;
1019 
1020 	parent = to_cxl_port(port->dev.parent);
1021 	if (is_cxl_root(parent))
1022 		return true;
1023 
1024 	return false;
1025 }
1026 
1027 struct cxl_root *find_cxl_root(struct cxl_port *port)
1028 {
1029 	struct cxl_port *iter = port;
1030 
1031 	while (iter && !is_cxl_root(iter))
1032 		iter = to_cxl_port(iter->dev.parent);
1033 
1034 	if (!iter)
1035 		return NULL;
1036 	get_device(&iter->dev);
1037 	return to_cxl_root(iter);
1038 }
1039 EXPORT_SYMBOL_NS_GPL(find_cxl_root, "CXL");
1040 
1041 static struct cxl_dport *find_dport(struct cxl_port *port, int id)
1042 {
1043 	struct cxl_dport *dport;
1044 	unsigned long index;
1045 
1046 	device_lock_assert(&port->dev);
1047 	xa_for_each(&port->dports, index, dport)
1048 		if (dport->port_id == id)
1049 			return dport;
1050 	return NULL;
1051 }
1052 
1053 static int add_dport(struct cxl_port *port, struct cxl_dport *dport)
1054 {
1055 	struct cxl_dport *dup;
1056 	int rc;
1057 
1058 	device_lock_assert(&port->dev);
1059 	dup = find_dport(port, dport->port_id);
1060 	if (dup) {
1061 		dev_err(&port->dev,
1062 			"unable to add dport%d-%s non-unique port id (%s)\n",
1063 			dport->port_id, dev_name(dport->dport_dev),
1064 			dev_name(dup->dport_dev));
1065 		return -EBUSY;
1066 	}
1067 
1068 	/* Arrange for dport_dev to be valid through remove_dport() */
1069 	struct device *dev __free(put_device) = get_device(dport->dport_dev);
1070 
1071 	rc = xa_insert(&port->dports, (unsigned long)dport->dport_dev, dport,
1072 		       GFP_KERNEL);
1073 	if (rc)
1074 		return rc;
1075 
1076 	retain_and_null_ptr(dev);
1077 	port->nr_dports++;
1078 	return 0;
1079 }
1080 
1081 /*
1082  * Since root-level CXL dports cannot be enumerated by PCI they are not
1083  * enumerated by the common port driver that acquires the port lock over
1084  * dport add/remove. Instead, root dports are manually added by a
1085  * platform driver and cond_cxl_root_lock() is used to take the missing
1086  * port lock in that case.
1087  */
1088 static void cond_cxl_root_lock(struct cxl_port *port)
1089 {
1090 	if (is_cxl_root(port))
1091 		device_lock(&port->dev);
1092 }
1093 
1094 static void cond_cxl_root_unlock(struct cxl_port *port)
1095 {
1096 	if (is_cxl_root(port))
1097 		device_unlock(&port->dev);
1098 }
1099 
1100 static void cxl_dport_remove(void *data)
1101 {
1102 	struct cxl_dport *dport = data;
1103 	struct cxl_port *port = dport->port;
1104 
1105 	port->nr_dports--;
1106 	xa_erase(&port->dports, (unsigned long) dport->dport_dev);
1107 	put_device(dport->dport_dev);
1108 }
1109 
1110 static void cxl_dport_unlink(void *data)
1111 {
1112 	struct cxl_dport *dport = data;
1113 	struct cxl_port *port = dport->port;
1114 	char link_name[CXL_TARGET_STRLEN];
1115 
1116 	sprintf(link_name, "dport%d", dport->port_id);
1117 	sysfs_remove_link(&port->dev.kobj, link_name);
1118 }
1119 
1120 static void free_dport(void *dport)
1121 {
1122 	kfree(dport);
1123 }
1124 
1125 /*
1126  * Upon return either a group is established with one action (free_dport()), or
1127  * no group established and @dport is freed.
1128  */
1129 static void *cxl_dport_open_dr_group_or_free(struct cxl_dport *dport)
1130 {
1131 	int rc;
1132 	struct device *host = dport_to_host(dport);
1133 	void *group = devres_open_group(host, dport, GFP_KERNEL);
1134 
1135 	if (!group) {
1136 		kfree(dport);
1137 		return NULL;
1138 	}
1139 
1140 	rc = devm_add_action_or_reset(host, free_dport, dport);
1141 	if (rc) {
1142 		devres_release_group(host, group);
1143 		return NULL;
1144 	}
1145 
1146 	return group;
1147 }
1148 
1149 static void cxl_dport_close_dr_group(struct cxl_dport *dport, void *group)
1150 {
1151 	devres_close_group(dport_to_host(dport), group);
1152 }
1153 
1154 static void del_dport(struct cxl_dport *dport)
1155 {
1156 	devres_release_group(dport_to_host(dport), dport);
1157 }
1158 
1159 /* The dport group id is the dport */
1160 DEFINE_FREE(cxl_dport_release_dr_group, void *, if (_T) del_dport(_T))
1161 
1162 static struct cxl_dport *
1163 __devm_cxl_add_dport(struct cxl_port *port, struct device *dport_dev,
1164 		     int port_id, resource_size_t component_reg_phys,
1165 		     resource_size_t rcrb)
1166 {
1167 	char link_name[CXL_TARGET_STRLEN];
1168 	struct cxl_dport *dport;
1169 	struct device *host;
1170 	int rc;
1171 
1172 	if (is_cxl_root(port))
1173 		host = port->uport_dev;
1174 	else
1175 		host = &port->dev;
1176 
1177 	if (!host->driver) {
1178 		dev_WARN_ONCE(&port->dev, 1, "dport:%s bad devm context\n",
1179 			      dev_name(dport_dev));
1180 		return ERR_PTR(-ENXIO);
1181 	}
1182 
1183 	if (snprintf(link_name, CXL_TARGET_STRLEN, "dport%d", port_id) >=
1184 	    CXL_TARGET_STRLEN)
1185 		return ERR_PTR(-EINVAL);
1186 
1187 	dport = kzalloc(sizeof(*dport), GFP_KERNEL);
1188 	if (!dport)
1189 		return ERR_PTR(-ENOMEM);
1190 
1191 	/* Just enough init to manage the devres group */
1192 	dport->dport_dev = dport_dev;
1193 	dport->port_id = port_id;
1194 	dport->port = port;
1195 
1196 	void *dport_dr_group __free(cxl_dport_release_dr_group) =
1197 		cxl_dport_open_dr_group_or_free(dport);
1198 	if (!dport_dr_group)
1199 		return ERR_PTR(-ENOMEM);
1200 
1201 	if (rcrb == CXL_RESOURCE_NONE) {
1202 		rc = cxl_dport_setup_regs(&port->dev, dport,
1203 					  component_reg_phys);
1204 		if (rc)
1205 			return ERR_PTR(rc);
1206 	} else {
1207 		dport->rcrb.base = rcrb;
1208 		component_reg_phys = __rcrb_to_component(dport_dev, &dport->rcrb,
1209 							 CXL_RCRB_DOWNSTREAM);
1210 		if (component_reg_phys == CXL_RESOURCE_NONE) {
1211 			dev_warn(dport_dev, "Invalid Component Registers in RCRB");
1212 			return ERR_PTR(-ENXIO);
1213 		}
1214 
1215 		/*
1216 		 * RCH @dport is not ready to map until associated with its
1217 		 * memdev
1218 		 */
1219 		rc = cxl_dport_setup_regs(NULL, dport, component_reg_phys);
1220 		if (rc)
1221 			return ERR_PTR(rc);
1222 
1223 		dport->rch = true;
1224 	}
1225 
1226 	if (component_reg_phys != CXL_RESOURCE_NONE)
1227 		dev_dbg(dport_dev, "Component Registers found for dport: %pa\n",
1228 			&component_reg_phys);
1229 
1230 	cond_cxl_root_lock(port);
1231 	rc = add_dport(port, dport);
1232 	cond_cxl_root_unlock(port);
1233 	if (rc)
1234 		return ERR_PTR(rc);
1235 
1236 	rc = devm_add_action_or_reset(host, cxl_dport_remove, dport);
1237 	if (rc)
1238 		return ERR_PTR(rc);
1239 
1240 	rc = sysfs_create_link(&port->dev.kobj, &dport_dev->kobj, link_name);
1241 	if (rc)
1242 		return ERR_PTR(rc);
1243 
1244 	rc = devm_add_action_or_reset(host, cxl_dport_unlink, dport);
1245 	if (rc)
1246 		return ERR_PTR(rc);
1247 
1248 	if (dev_is_pci(dport_dev))
1249 		dport->link_latency = cxl_pci_get_latency(to_pci_dev(dport_dev));
1250 
1251 	cxl_debugfs_create_dport_dir(dport);
1252 
1253 	if (!dport->rch)
1254 		devm_cxl_dport_ras_setup(dport);
1255 
1256 	/* keep the group, and mark the end of devm actions */
1257 	cxl_dport_close_dr_group(dport, no_free_ptr(dport_dr_group));
1258 
1259 	return dport;
1260 }
1261 
1262 /**
1263  * devm_cxl_add_dport - append VH downstream port data to a cxl_port
1264  * @port: the cxl_port that references this dport
1265  * @dport_dev: firmware or PCI device representing the dport
1266  * @port_id: identifier for this dport in a decoder's target list
1267  * @component_reg_phys: optional location of CXL component registers
1268  *
1269  * Note that dports are appended to the devm release action's of the
1270  * either the port's host (for root ports), or the port itself (for
1271  * switch ports)
1272  */
1273 struct cxl_dport *devm_cxl_add_dport(struct cxl_port *port,
1274 				     struct device *dport_dev, int port_id,
1275 				     resource_size_t component_reg_phys)
1276 {
1277 	struct cxl_dport *dport;
1278 
1279 	dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1280 				     component_reg_phys, CXL_RESOURCE_NONE);
1281 	if (IS_ERR(dport)) {
1282 		dev_dbg(dport_dev, "failed to add dport to %s: %ld\n",
1283 			dev_name(&port->dev), PTR_ERR(dport));
1284 	} else {
1285 		dev_dbg(dport_dev, "dport added to %s\n",
1286 			dev_name(&port->dev));
1287 	}
1288 
1289 	return dport;
1290 }
1291 EXPORT_SYMBOL_NS_GPL(devm_cxl_add_dport, "CXL");
1292 
1293 /**
1294  * devm_cxl_add_rch_dport - append RCH downstream port data to a cxl_port
1295  * @port: the cxl_port that references this dport
1296  * @dport_dev: firmware or PCI device representing the dport
1297  * @port_id: identifier for this dport in a decoder's target list
1298  * @rcrb: mandatory location of a Root Complex Register Block
1299  *
1300  * See CXL 3.0 9.11.8 CXL Devices Attached to an RCH
1301  */
1302 struct cxl_dport *devm_cxl_add_rch_dport(struct cxl_port *port,
1303 					 struct device *dport_dev, int port_id,
1304 					 resource_size_t rcrb)
1305 {
1306 	struct cxl_dport *dport;
1307 
1308 	if (rcrb == CXL_RESOURCE_NONE) {
1309 		dev_dbg(&port->dev, "failed to add RCH dport, missing RCRB\n");
1310 		return ERR_PTR(-EINVAL);
1311 	}
1312 
1313 	dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1314 				     CXL_RESOURCE_NONE, rcrb);
1315 	if (IS_ERR(dport)) {
1316 		dev_dbg(dport_dev, "failed to add RCH dport to %s: %ld\n",
1317 			dev_name(&port->dev), PTR_ERR(dport));
1318 	} else {
1319 		dev_dbg(dport_dev, "RCH dport added to %s\n",
1320 			dev_name(&port->dev));
1321 	}
1322 
1323 	return dport;
1324 }
1325 EXPORT_SYMBOL_NS_GPL(devm_cxl_add_rch_dport, "CXL");
1326 
1327 static int add_ep(struct cxl_ep *new)
1328 {
1329 	struct cxl_port *port = new->dport->port;
1330 
1331 	guard(device)(&port->dev);
1332 	if (port->dead)
1333 		return -ENXIO;
1334 
1335 	return xa_insert(&port->endpoints, (unsigned long)new->ep,
1336 			 new, GFP_KERNEL);
1337 }
1338 
1339 /**
1340  * cxl_add_ep - register an endpoint's interest in a port
1341  * @dport: the dport that routes to @ep_dev
1342  * @ep_dev: device representing the endpoint
1343  *
1344  * Intermediate CXL ports are scanned based on the arrival of endpoints.
1345  * When those endpoints depart the port can be destroyed once all
1346  * endpoints that care about that port have been removed.
1347  */
1348 static int cxl_add_ep(struct cxl_dport *dport, struct device *ep_dev)
1349 {
1350 	struct cxl_ep *ep;
1351 	int rc;
1352 
1353 	ep = kzalloc(sizeof(*ep), GFP_KERNEL);
1354 	if (!ep)
1355 		return -ENOMEM;
1356 
1357 	ep->ep = get_device(ep_dev);
1358 	ep->dport = dport;
1359 
1360 	rc = add_ep(ep);
1361 	if (rc)
1362 		cxl_ep_release(ep);
1363 	return rc;
1364 }
1365 
1366 struct cxl_find_port_ctx {
1367 	const struct device *dport_dev;
1368 	const struct cxl_port *parent_port;
1369 	struct cxl_dport **dport;
1370 };
1371 
1372 static int match_port_by_dport(struct device *dev, const void *data)
1373 {
1374 	const struct cxl_find_port_ctx *ctx = data;
1375 	struct cxl_dport *dport;
1376 	struct cxl_port *port;
1377 
1378 	if (!is_cxl_port(dev))
1379 		return 0;
1380 	if (ctx->parent_port && dev->parent != &ctx->parent_port->dev)
1381 		return 0;
1382 
1383 	port = to_cxl_port(dev);
1384 	dport = cxl_find_dport_by_dev(port, ctx->dport_dev);
1385 	if (ctx->dport)
1386 		*ctx->dport = dport;
1387 	return dport != NULL;
1388 }
1389 
1390 static struct cxl_port *__find_cxl_port(struct cxl_find_port_ctx *ctx)
1391 {
1392 	struct device *dev;
1393 
1394 	if (!ctx->dport_dev)
1395 		return NULL;
1396 
1397 	dev = bus_find_device(&cxl_bus_type, NULL, ctx, match_port_by_dport);
1398 	if (dev)
1399 		return to_cxl_port(dev);
1400 	return NULL;
1401 }
1402 
1403 static struct cxl_port *find_cxl_port(struct device *dport_dev,
1404 				      struct cxl_dport **dport)
1405 {
1406 	struct cxl_find_port_ctx ctx = {
1407 		.dport_dev = dport_dev,
1408 		.dport = dport,
1409 	};
1410 	struct cxl_port *port;
1411 
1412 	port = __find_cxl_port(&ctx);
1413 	return port;
1414 }
1415 
1416 /*
1417  * All users of grandparent() are using it to walk PCIe-like switch port
1418  * hierarchy. A PCIe switch is comprised of a bridge device representing the
1419  * upstream switch port and N bridges representing downstream switch ports. When
1420  * bridges stack the grand-parent of a downstream switch port is another
1421  * downstream switch port in the immediate ancestor switch.
1422  */
1423 static struct device *grandparent(struct device *dev)
1424 {
1425 	if (dev && dev->parent)
1426 		return dev->parent->parent;
1427 	return NULL;
1428 }
1429 
1430 static struct device *endpoint_host(struct cxl_port *endpoint)
1431 {
1432 	struct cxl_port *port = to_cxl_port(endpoint->dev.parent);
1433 
1434 	if (is_cxl_root(port))
1435 		return port->uport_dev;
1436 	return &port->dev;
1437 }
1438 
1439 static void delete_endpoint(void *data)
1440 {
1441 	struct cxl_memdev *cxlmd = data;
1442 	struct cxl_port *endpoint = cxlmd->endpoint;
1443 	struct device *host = endpoint_host(endpoint);
1444 
1445 	scoped_guard(device, host) {
1446 		if (host->driver && !endpoint->dead) {
1447 			devm_release_action(host, cxl_unlink_parent_dport, endpoint);
1448 			devm_release_action(host, cxl_unlink_uport, endpoint);
1449 			devm_release_action(host, unregister_port, endpoint);
1450 		}
1451 		cxlmd->endpoint = NULL;
1452 	}
1453 	put_device(&endpoint->dev);
1454 	put_device(host);
1455 }
1456 
1457 int cxl_endpoint_autoremove(struct cxl_memdev *cxlmd, struct cxl_port *endpoint)
1458 {
1459 	struct device *host = endpoint_host(endpoint);
1460 	struct device *dev = &cxlmd->dev;
1461 
1462 	get_device(host);
1463 	get_device(&endpoint->dev);
1464 	cxlmd->depth = endpoint->depth;
1465 	return devm_add_action_or_reset(dev, delete_endpoint, cxlmd);
1466 }
1467 EXPORT_SYMBOL_NS_GPL(cxl_endpoint_autoremove, "CXL");
1468 
1469 /*
1470  * The natural end of life of a non-root 'cxl_port' is when its parent port goes
1471  * through a ->remove() event ("top-down" unregistration). The unnatural trigger
1472  * for a port to be unregistered is when all memdevs beneath that port have gone
1473  * through ->remove(). This "bottom-up" removal selectively removes individual
1474  * child ports manually. This depends on devm_cxl_add_port() to not change is
1475  * devm action registration order, and for dports to have already been
1476  * destroyed by del_dports().
1477  */
1478 static void delete_switch_port(struct cxl_port *port)
1479 {
1480 	devm_release_action(port->dev.parent, cxl_unlink_parent_dport, port);
1481 	devm_release_action(port->dev.parent, cxl_unlink_uport, port);
1482 	devm_release_action(port->dev.parent, unregister_port, port);
1483 }
1484 
1485 static void del_dports(struct cxl_port *port)
1486 {
1487 	struct cxl_dport *dport;
1488 	unsigned long index;
1489 
1490 	device_lock_assert(&port->dev);
1491 
1492 	xa_for_each(&port->dports, index, dport)
1493 		del_dport(dport);
1494 }
1495 
1496 struct detach_ctx {
1497 	struct cxl_memdev *cxlmd;
1498 	int depth;
1499 };
1500 
1501 static int port_has_memdev(struct device *dev, const void *data)
1502 {
1503 	const struct detach_ctx *ctx = data;
1504 	struct cxl_port *port;
1505 
1506 	if (!is_cxl_port(dev))
1507 		return 0;
1508 
1509 	port = to_cxl_port(dev);
1510 	if (port->depth != ctx->depth)
1511 		return 0;
1512 
1513 	return !!cxl_ep_load(port, ctx->cxlmd);
1514 }
1515 
1516 static void cxl_detach_ep(void *data)
1517 {
1518 	struct cxl_memdev *cxlmd = data;
1519 
1520 	for (int i = cxlmd->depth - 1; i >= 1; i--) {
1521 		struct cxl_port *port, *parent_port;
1522 		struct detach_ctx ctx = {
1523 			.cxlmd = cxlmd,
1524 			.depth = i,
1525 		};
1526 		struct cxl_ep *ep;
1527 		bool died = false;
1528 
1529 		struct device *dev __free(put_device) =
1530 			bus_find_device(&cxl_bus_type, NULL, &ctx, port_has_memdev);
1531 		if (!dev)
1532 			continue;
1533 		port = to_cxl_port(dev);
1534 
1535 		parent_port = to_cxl_port(port->dev.parent);
1536 		device_lock(&parent_port->dev);
1537 		device_lock(&port->dev);
1538 		ep = cxl_ep_load(port, cxlmd);
1539 		dev_dbg(&cxlmd->dev, "disconnect %s from %s\n",
1540 			ep ? dev_name(ep->ep) : "", dev_name(&port->dev));
1541 		cxl_ep_remove(port, ep);
1542 		if (ep && !port->dead && xa_empty(&port->endpoints) &&
1543 		    !is_cxl_root(parent_port) && parent_port->dev.driver) {
1544 			/*
1545 			 * This was the last ep attached to a dynamically
1546 			 * enumerated port. Block new cxl_add_ep() and garbage
1547 			 * collect the port.
1548 			 */
1549 			died = true;
1550 			port->dead = true;
1551 			del_dports(port);
1552 		}
1553 		device_unlock(&port->dev);
1554 
1555 		if (died) {
1556 			dev_dbg(&cxlmd->dev, "delete %s\n",
1557 				dev_name(&port->dev));
1558 			delete_switch_port(port);
1559 		}
1560 		device_unlock(&parent_port->dev);
1561 	}
1562 }
1563 
1564 static resource_size_t find_component_registers(struct device *dev)
1565 {
1566 	struct cxl_register_map map;
1567 	struct pci_dev *pdev;
1568 
1569 	/*
1570 	 * Theoretically, CXL component registers can be hosted on a
1571 	 * non-PCI device, in practice, only cxl_test hits this case.
1572 	 */
1573 	if (!dev_is_pci(dev))
1574 		return CXL_RESOURCE_NONE;
1575 
1576 	pdev = to_pci_dev(dev);
1577 
1578 	cxl_find_regblock(pdev, CXL_REGLOC_RBI_COMPONENT, &map);
1579 	return map.resource;
1580 }
1581 
1582 static int match_port_by_uport(struct device *dev, const void *data)
1583 {
1584 	const struct device *uport_dev = data;
1585 	struct cxl_port *port;
1586 
1587 	if (!is_cxl_port(dev))
1588 		return 0;
1589 
1590 	port = to_cxl_port(dev);
1591 	/* Endpoint ports are hosted by memdevs */
1592 	if (is_cxl_memdev(port->uport_dev))
1593 		return uport_dev == port->uport_dev->parent;
1594 	return uport_dev == port->uport_dev;
1595 }
1596 
1597 /**
1598  * find_cxl_port_by_uport - Find a CXL port device companion
1599  * @uport_dev: Device that acts as a switch or endpoint in the CXL hierarchy
1600  *
1601  * In the case of endpoint ports recall that port->uport_dev points to a 'struct
1602  * cxl_memdev' device. So, the @uport_dev argument is the parent device of the
1603  * 'struct cxl_memdev' in that case.
1604  *
1605  * Function takes a device reference on the port device. Caller should do a
1606  * put_device() when done.
1607  */
1608 static struct cxl_port *find_cxl_port_by_uport(struct device *uport_dev)
1609 {
1610 	struct device *dev;
1611 
1612 	dev = bus_find_device(&cxl_bus_type, NULL, uport_dev, match_port_by_uport);
1613 	if (dev)
1614 		return to_cxl_port(dev);
1615 	return NULL;
1616 }
1617 
1618 static int update_decoder_targets(struct device *dev, void *data)
1619 {
1620 	struct cxl_dport *dport = data;
1621 	struct cxl_switch_decoder *cxlsd;
1622 	struct cxl_decoder *cxld;
1623 	int i;
1624 
1625 	if (!is_switch_decoder(dev))
1626 		return 0;
1627 
1628 	cxlsd = to_cxl_switch_decoder(dev);
1629 	cxld = &cxlsd->cxld;
1630 	guard(rwsem_write)(&cxl_rwsem.region);
1631 
1632 	for (i = 0; i < cxld->interleave_ways; i++) {
1633 		if (cxld->target_map[i] == dport->port_id) {
1634 			cxlsd->target[i] = dport;
1635 			dev_dbg(dev, "dport%d found in target list, index %d\n",
1636 				dport->port_id, i);
1637 			return 0;
1638 		}
1639 	}
1640 
1641 	return 0;
1642 }
1643 
1644 void cxl_port_update_decoder_targets(struct cxl_port *port,
1645 				     struct cxl_dport *dport)
1646 {
1647 	device_for_each_child(&port->dev, dport, update_decoder_targets);
1648 }
1649 EXPORT_SYMBOL_NS_GPL(cxl_port_update_decoder_targets, "CXL");
1650 
1651 static bool dport_exists(struct cxl_port *port, struct device *dport_dev)
1652 {
1653 	struct cxl_dport *dport = cxl_find_dport_by_dev(port, dport_dev);
1654 
1655 	if (dport) {
1656 		dev_dbg(&port->dev, "dport%d:%s already exists\n",
1657 			dport->port_id, dev_name(dport_dev));
1658 		return true;
1659 	}
1660 
1661 	return false;
1662 }
1663 
1664 static struct cxl_dport *probe_dport(struct cxl_port *port,
1665 				     struct device *dport_dev)
1666 {
1667 	struct cxl_driver *drv;
1668 
1669 	device_lock_assert(&port->dev);
1670 	if (!port->dev.driver)
1671 		return ERR_PTR(-ENXIO);
1672 
1673 	if (dport_exists(port, dport_dev))
1674 		return ERR_PTR(-EBUSY);
1675 
1676 	drv = container_of(port->dev.driver, struct cxl_driver, drv);
1677 	if (!drv->add_dport)
1678 		return ERR_PTR(-ENXIO);
1679 
1680 	/* see cxl_port_add_dport() */
1681 	return drv->add_dport(port, dport_dev);
1682 }
1683 
1684 static struct cxl_dport *devm_cxl_create_port(struct device *ep_dev,
1685 					      struct cxl_port *parent_port,
1686 					      struct cxl_dport *parent_dport,
1687 					      struct device *uport_dev,
1688 					      struct device *dport_dev)
1689 {
1690 	resource_size_t component_reg_phys;
1691 
1692 	device_lock_assert(&parent_port->dev);
1693 	if (!parent_port->dev.driver) {
1694 		dev_warn(ep_dev,
1695 			 "port %s:%s:%s disabled, failed to enumerate CXL.mem\n",
1696 			 dev_name(&parent_port->dev), dev_name(uport_dev),
1697 			 dev_name(dport_dev));
1698 	}
1699 
1700 	struct cxl_port *port __free(put_cxl_port) =
1701 		find_cxl_port_by_uport(uport_dev);
1702 	if (!port) {
1703 		component_reg_phys = find_component_registers(uport_dev);
1704 		port = devm_cxl_add_port(&parent_port->dev, uport_dev,
1705 					 component_reg_phys, parent_dport);
1706 		if (IS_ERR(port))
1707 			return ERR_CAST(port);
1708 
1709 		/*
1710 		 * retry to make sure a port is found. a port device
1711 		 * reference is taken.
1712 		 */
1713 		port = find_cxl_port_by_uport(uport_dev);
1714 		if (!port)
1715 			return ERR_PTR(-ENODEV);
1716 
1717 		dev_dbg(ep_dev, "created port %s:%s\n",
1718 			dev_name(&port->dev), dev_name(port->uport_dev));
1719 	} else {
1720 		/*
1721 		 * Port was created before right before this function is
1722 		 * called. Signal the caller to deal with it.
1723 		 */
1724 		return ERR_PTR(-EAGAIN);
1725 	}
1726 
1727 	guard(device)(&port->dev);
1728 	return probe_dport(port, dport_dev);
1729 }
1730 
1731 static int add_port_attach_ep(struct cxl_memdev *cxlmd,
1732 			      struct device *uport_dev,
1733 			      struct device *dport_dev)
1734 {
1735 	struct device *dparent = grandparent(dport_dev);
1736 	struct cxl_dport *dport, *parent_dport;
1737 	int rc;
1738 
1739 	if (is_cxl_host_bridge(dparent)) {
1740 		/*
1741 		 * The iteration reached the topology root without finding the
1742 		 * CXL-root 'cxl_port' on a previous iteration, fail for now to
1743 		 * be re-probed after platform driver attaches.
1744 		 */
1745 		dev_dbg(&cxlmd->dev, "%s is a root dport\n",
1746 			dev_name(dport_dev));
1747 		return -ENXIO;
1748 	}
1749 
1750 	struct cxl_port *parent_port __free(put_cxl_port) =
1751 		find_cxl_port_by_uport(dparent->parent);
1752 	if (!parent_port) {
1753 		/* iterate to create this parent_port */
1754 		return -EAGAIN;
1755 	}
1756 
1757 	scoped_guard(device, &parent_port->dev) {
1758 		parent_dport = cxl_find_dport_by_dev(parent_port, dparent);
1759 		if (!parent_dport) {
1760 			parent_dport = probe_dport(parent_port, dparent);
1761 			if (IS_ERR(parent_dport))
1762 				return PTR_ERR(parent_dport);
1763 		}
1764 
1765 		dport = devm_cxl_create_port(&cxlmd->dev, parent_port,
1766 					     parent_dport, uport_dev,
1767 					     dport_dev);
1768 		if (IS_ERR(dport)) {
1769 			/* Port already exists, restart iteration */
1770 			if (PTR_ERR(dport) == -EAGAIN)
1771 				return 0;
1772 			return PTR_ERR(dport);
1773 		}
1774 	}
1775 
1776 	rc = cxl_add_ep(dport, &cxlmd->dev);
1777 	if (rc == -EBUSY) {
1778 		/*
1779 		 * "can't" happen, but this error code means
1780 		 * something to the caller, so translate it.
1781 		 */
1782 		rc = -ENXIO;
1783 	}
1784 
1785 	return rc;
1786 }
1787 
1788 static struct cxl_dport *find_or_add_dport(struct cxl_port *port,
1789 					   struct device *dport_dev)
1790 {
1791 	struct cxl_dport *dport;
1792 
1793 	device_lock_assert(&port->dev);
1794 	dport = cxl_find_dport_by_dev(port, dport_dev);
1795 	if (!dport) {
1796 		dport = probe_dport(port, dport_dev);
1797 		if (IS_ERR(dport))
1798 			return dport;
1799 
1800 		/* New dport added, restart iteration */
1801 		return ERR_PTR(-EAGAIN);
1802 	}
1803 
1804 	return dport;
1805 }
1806 
1807 int devm_cxl_enumerate_ports(struct cxl_memdev *cxlmd)
1808 {
1809 	struct device *dev = &cxlmd->dev;
1810 	struct device *iter;
1811 	int rc;
1812 
1813 	/*
1814 	 * Skip intermediate port enumeration in the RCH case, there
1815 	 * are no ports in between a host bridge and an endpoint.
1816 	 */
1817 	if (cxlmd->cxlds->rcd)
1818 		return 0;
1819 
1820 	rc = devm_add_action_or_reset(&cxlmd->dev, cxl_detach_ep, cxlmd);
1821 	if (rc)
1822 		return rc;
1823 
1824 	/*
1825 	 * Scan for and add all cxl_ports in this device's ancestry.
1826 	 * Repeat until no more ports are added. Abort if a port add
1827 	 * attempt fails.
1828 	 */
1829 retry:
1830 	for (iter = dev; iter; iter = grandparent(iter)) {
1831 		struct device *dport_dev = grandparent(iter);
1832 		struct device *uport_dev;
1833 		struct cxl_dport *dport;
1834 
1835 		if (is_cxl_host_bridge(dport_dev))
1836 			return 0;
1837 
1838 		uport_dev = dport_dev->parent;
1839 		if (!uport_dev) {
1840 			dev_warn(dev, "at %s no parent for dport: %s\n",
1841 				 dev_name(iter), dev_name(dport_dev));
1842 			return -ENXIO;
1843 		}
1844 
1845 		dev_dbg(dev, "scan: iter: %s dport_dev: %s parent: %s\n",
1846 			dev_name(iter), dev_name(dport_dev),
1847 			dev_name(uport_dev));
1848 		struct cxl_port *port __free(put_cxl_port) =
1849 			find_cxl_port_by_uport(uport_dev);
1850 		if (port) {
1851 			dev_dbg(&cxlmd->dev,
1852 				"found already registered port %s:%s\n",
1853 				dev_name(&port->dev),
1854 				dev_name(port->uport_dev));
1855 
1856 			/*
1857 			 * RP port enumerated by cxl_acpi without dport will
1858 			 * have the dport added here.
1859 			 */
1860 			scoped_guard(device, &port->dev) {
1861 				dport = find_or_add_dport(port, dport_dev);
1862 				if (IS_ERR(dport)) {
1863 					if (PTR_ERR(dport) == -EAGAIN)
1864 						goto retry;
1865 					return PTR_ERR(dport);
1866 				}
1867 			}
1868 
1869 			rc = cxl_add_ep(dport, &cxlmd->dev);
1870 
1871 			/*
1872 			 * If the endpoint already exists in the port's list,
1873 			 * that's ok, it was added on a previous pass.
1874 			 * Otherwise, retry in add_port_attach_ep() after taking
1875 			 * the parent_port lock as the current port may be being
1876 			 * reaped.
1877 			 */
1878 			if (rc && rc != -EBUSY)
1879 				return rc;
1880 
1881 			cxl_gpf_port_setup(dport);
1882 
1883 			/* Any more ports to add between this one and the root? */
1884 			if (!dev_is_cxl_root_child(&port->dev))
1885 				continue;
1886 
1887 			return 0;
1888 		}
1889 
1890 		rc = add_port_attach_ep(cxlmd, uport_dev, dport_dev);
1891 		/* port missing, try to add parent */
1892 		if (rc == -EAGAIN)
1893 			continue;
1894 		/* failed to add ep or port */
1895 		if (rc)
1896 			return rc;
1897 		/* port added, new descendants possible, start over */
1898 		goto retry;
1899 	}
1900 
1901 	return 0;
1902 }
1903 EXPORT_SYMBOL_NS_GPL(devm_cxl_enumerate_ports, "CXL");
1904 
1905 struct cxl_port *cxl_pci_find_port(struct pci_dev *pdev,
1906 				   struct cxl_dport **dport)
1907 {
1908 	return find_cxl_port(pdev->dev.parent, dport);
1909 }
1910 EXPORT_SYMBOL_NS_GPL(cxl_pci_find_port, "CXL");
1911 
1912 struct cxl_port *cxl_mem_find_port(struct cxl_memdev *cxlmd,
1913 				   struct cxl_dport **dport)
1914 {
1915 	return find_cxl_port(grandparent(&cxlmd->dev), dport);
1916 }
1917 EXPORT_SYMBOL_NS_GPL(cxl_mem_find_port, "CXL");
1918 
1919 static int decoder_populate_targets(struct cxl_switch_decoder *cxlsd,
1920 				    struct cxl_port *port)
1921 {
1922 	struct cxl_decoder *cxld = &cxlsd->cxld;
1923 	int i;
1924 
1925 	device_lock_assert(&port->dev);
1926 
1927 	if (xa_empty(&port->dports))
1928 		return 0;
1929 
1930 	guard(rwsem_write)(&cxl_rwsem.region);
1931 	for (i = 0; i < cxlsd->cxld.interleave_ways; i++) {
1932 		struct cxl_dport *dport = find_dport(port, cxld->target_map[i]);
1933 
1934 		if (!dport) {
1935 			/* dport may be activated later */
1936 			continue;
1937 		}
1938 		cxlsd->target[i] = dport;
1939 	}
1940 
1941 	return 0;
1942 }
1943 
1944 static struct lock_class_key cxl_decoder_key;
1945 
1946 /**
1947  * cxl_decoder_init - Common decoder setup / initialization
1948  * @port: owning port of this decoder
1949  * @cxld: common decoder properties to initialize
1950  *
1951  * A port may contain one or more decoders. Each of those decoders
1952  * enable some address space for CXL.mem utilization. A decoder is
1953  * expected to be configured by the caller before registering via
1954  * cxl_decoder_add()
1955  */
1956 static int cxl_decoder_init(struct cxl_port *port, struct cxl_decoder *cxld)
1957 {
1958 	struct device *dev;
1959 	int rc;
1960 
1961 	rc = ida_alloc(&port->decoder_ida, GFP_KERNEL);
1962 	if (rc < 0)
1963 		return rc;
1964 
1965 	/* need parent to stick around to release the id */
1966 	get_device(&port->dev);
1967 	cxld->id = rc;
1968 
1969 	dev = &cxld->dev;
1970 	device_initialize(dev);
1971 	lockdep_set_class(&dev->mutex, &cxl_decoder_key);
1972 	device_set_pm_not_required(dev);
1973 	dev->parent = &port->dev;
1974 	dev->bus = &cxl_bus_type;
1975 
1976 	/* Pre initialize an "empty" decoder */
1977 	cxld->interleave_ways = 1;
1978 	cxld->interleave_granularity = PAGE_SIZE;
1979 	cxld->target_type = CXL_DECODER_HOSTONLYMEM;
1980 	cxld->hpa_range = (struct range) {
1981 		.start = 0,
1982 		.end = -1,
1983 	};
1984 
1985 	return 0;
1986 }
1987 
1988 static int cxl_switch_decoder_init(struct cxl_port *port,
1989 				   struct cxl_switch_decoder *cxlsd,
1990 				   int nr_targets)
1991 {
1992 	if (nr_targets > CXL_DECODER_MAX_INTERLEAVE)
1993 		return -EINVAL;
1994 
1995 	cxlsd->nr_targets = nr_targets;
1996 	return cxl_decoder_init(port, &cxlsd->cxld);
1997 }
1998 
1999 /**
2000  * cxl_root_decoder_alloc - Allocate a root level decoder
2001  * @port: owning CXL root of this decoder
2002  * @nr_targets: static number of downstream targets
2003  *
2004  * Return: A new cxl decoder to be registered by cxl_decoder_add(). A
2005  * 'CXL root' decoder is one that decodes from a top-level / static platform
2006  * firmware description of CXL resources into a CXL standard decode
2007  * topology.
2008  */
2009 struct cxl_root_decoder *cxl_root_decoder_alloc(struct cxl_port *port,
2010 						unsigned int nr_targets)
2011 {
2012 	struct cxl_root_decoder *cxlrd;
2013 	struct cxl_switch_decoder *cxlsd;
2014 	struct cxl_decoder *cxld;
2015 	int rc;
2016 
2017 	if (!is_cxl_root(port))
2018 		return ERR_PTR(-EINVAL);
2019 
2020 	cxlrd = kzalloc(struct_size(cxlrd, cxlsd.target, nr_targets),
2021 			GFP_KERNEL);
2022 	if (!cxlrd)
2023 		return ERR_PTR(-ENOMEM);
2024 
2025 	cxlsd = &cxlrd->cxlsd;
2026 	rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
2027 	if (rc) {
2028 		kfree(cxlrd);
2029 		return ERR_PTR(rc);
2030 	}
2031 
2032 	mutex_init(&cxlrd->range_lock);
2033 
2034 	cxld = &cxlsd->cxld;
2035 	cxld->dev.type = &cxl_decoder_root_type;
2036 	/*
2037 	 * cxl_root_decoder_release() special cases negative ids to
2038 	 * detect memregion_alloc() failures.
2039 	 */
2040 	atomic_set(&cxlrd->region_id, -1);
2041 	rc = memregion_alloc(GFP_KERNEL);
2042 	if (rc < 0) {
2043 		put_device(&cxld->dev);
2044 		return ERR_PTR(rc);
2045 	}
2046 
2047 	atomic_set(&cxlrd->region_id, rc);
2048 	cxlrd->qos_class = CXL_QOS_CLASS_INVALID;
2049 	return cxlrd;
2050 }
2051 EXPORT_SYMBOL_NS_GPL(cxl_root_decoder_alloc, "CXL");
2052 
2053 /**
2054  * cxl_switch_decoder_alloc - Allocate a switch level decoder
2055  * @port: owning CXL switch port of this decoder
2056  * @nr_targets: max number of dynamically addressable downstream targets
2057  *
2058  * Return: A new cxl decoder to be registered by cxl_decoder_add(). A
2059  * 'switch' decoder is any decoder that can be enumerated by PCIe
2060  * topology and the HDM Decoder Capability. This includes the decoders
2061  * that sit between Switch Upstream Ports / Switch Downstream Ports and
2062  * Host Bridges / Root Ports.
2063  */
2064 struct cxl_switch_decoder *cxl_switch_decoder_alloc(struct cxl_port *port,
2065 						    unsigned int nr_targets)
2066 {
2067 	struct cxl_switch_decoder *cxlsd;
2068 	struct cxl_decoder *cxld;
2069 	int rc;
2070 
2071 	if (is_cxl_root(port) || is_cxl_endpoint(port))
2072 		return ERR_PTR(-EINVAL);
2073 
2074 	cxlsd = kzalloc(struct_size(cxlsd, target, nr_targets), GFP_KERNEL);
2075 	if (!cxlsd)
2076 		return ERR_PTR(-ENOMEM);
2077 
2078 	rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
2079 	if (rc) {
2080 		kfree(cxlsd);
2081 		return ERR_PTR(rc);
2082 	}
2083 
2084 	cxld = &cxlsd->cxld;
2085 	cxld->dev.type = &cxl_decoder_switch_type;
2086 	return cxlsd;
2087 }
2088 EXPORT_SYMBOL_NS_GPL(cxl_switch_decoder_alloc, "CXL");
2089 
2090 /**
2091  * cxl_endpoint_decoder_alloc - Allocate an endpoint decoder
2092  * @port: owning port of this decoder
2093  *
2094  * Return: A new cxl decoder to be registered by cxl_decoder_add()
2095  */
2096 struct cxl_endpoint_decoder *cxl_endpoint_decoder_alloc(struct cxl_port *port)
2097 {
2098 	struct cxl_endpoint_decoder *cxled;
2099 	struct cxl_decoder *cxld;
2100 	int rc;
2101 
2102 	if (!is_cxl_endpoint(port))
2103 		return ERR_PTR(-EINVAL);
2104 
2105 	cxled = kzalloc(sizeof(*cxled), GFP_KERNEL);
2106 	if (!cxled)
2107 		return ERR_PTR(-ENOMEM);
2108 
2109 	cxled->pos = -1;
2110 	cxled->part = -1;
2111 	cxld = &cxled->cxld;
2112 	rc = cxl_decoder_init(port, cxld);
2113 	if (rc)	 {
2114 		kfree(cxled);
2115 		return ERR_PTR(rc);
2116 	}
2117 
2118 	cxld->dev.type = &cxl_decoder_endpoint_type;
2119 	return cxled;
2120 }
2121 EXPORT_SYMBOL_NS_GPL(cxl_endpoint_decoder_alloc, "CXL");
2122 
2123 /**
2124  * cxl_decoder_add_locked - Add a decoder with targets
2125  * @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
2126  *
2127  * Certain types of decoders may not have any targets. The main example of this
2128  * is an endpoint device. A more awkward example is a hostbridge whose root
2129  * ports get hot added (technically possible, though unlikely).
2130  *
2131  * This is the locked variant of cxl_decoder_add().
2132  *
2133  * Context: Process context. Expects the device lock of the port that owns the
2134  *	    @cxld to be held.
2135  *
2136  * Return: Negative error code if the decoder wasn't properly configured; else
2137  *	   returns 0.
2138  */
2139 int cxl_decoder_add_locked(struct cxl_decoder *cxld)
2140 {
2141 	struct cxl_port *port;
2142 	struct device *dev;
2143 	int rc;
2144 
2145 	if (WARN_ON_ONCE(!cxld))
2146 		return -EINVAL;
2147 
2148 	if (WARN_ON_ONCE(IS_ERR(cxld)))
2149 		return PTR_ERR(cxld);
2150 
2151 	if (cxld->interleave_ways < 1)
2152 		return -EINVAL;
2153 
2154 	dev = &cxld->dev;
2155 
2156 	port = to_cxl_port(cxld->dev.parent);
2157 	if (!is_endpoint_decoder(dev)) {
2158 		struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
2159 
2160 		rc = decoder_populate_targets(cxlsd, port);
2161 		if (rc && (cxld->flags & CXL_DECODER_F_ENABLE)) {
2162 			dev_err(&port->dev,
2163 				"Failed to populate active decoder targets\n");
2164 			return rc;
2165 		}
2166 	}
2167 
2168 	rc = dev_set_name(dev, "decoder%d.%d", port->id, cxld->id);
2169 	if (rc)
2170 		return rc;
2171 
2172 	return device_add(dev);
2173 }
2174 EXPORT_SYMBOL_NS_GPL(cxl_decoder_add_locked, "CXL");
2175 
2176 /**
2177  * cxl_decoder_add - Add a decoder with targets
2178  * @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
2179  *
2180  * This is the unlocked variant of cxl_decoder_add_locked().
2181  * See cxl_decoder_add_locked().
2182  *
2183  * Context: Process context. Takes and releases the device lock of the port that
2184  *	    owns the @cxld.
2185  */
2186 int cxl_decoder_add(struct cxl_decoder *cxld)
2187 {
2188 	struct cxl_port *port;
2189 
2190 	if (WARN_ON_ONCE(!cxld))
2191 		return -EINVAL;
2192 
2193 	if (WARN_ON_ONCE(IS_ERR(cxld)))
2194 		return PTR_ERR(cxld);
2195 
2196 	port = to_cxl_port(cxld->dev.parent);
2197 
2198 	guard(device)(&port->dev);
2199 	return cxl_decoder_add_locked(cxld);
2200 }
2201 EXPORT_SYMBOL_NS_GPL(cxl_decoder_add, "CXL");
2202 
2203 static void cxld_unregister(void *dev)
2204 {
2205 	if (is_endpoint_decoder(dev))
2206 		cxl_decoder_detach(NULL, to_cxl_endpoint_decoder(dev), -1,
2207 				   DETACH_INVALIDATE);
2208 
2209 	device_unregister(dev);
2210 }
2211 
2212 int cxl_decoder_autoremove(struct device *host, struct cxl_decoder *cxld)
2213 {
2214 	return devm_add_action_or_reset(host, cxld_unregister, &cxld->dev);
2215 }
2216 EXPORT_SYMBOL_NS_GPL(cxl_decoder_autoremove, "CXL");
2217 
2218 /**
2219  * __cxl_driver_register - register a driver for the cxl bus
2220  * @cxl_drv: cxl driver structure to attach
2221  * @owner: owning module/driver
2222  * @modname: KBUILD_MODNAME for parent driver
2223  */
2224 int __cxl_driver_register(struct cxl_driver *cxl_drv, struct module *owner,
2225 			  const char *modname)
2226 {
2227 	if (!cxl_drv->probe) {
2228 		pr_debug("%s ->probe() must be specified\n", modname);
2229 		return -EINVAL;
2230 	}
2231 
2232 	if (!cxl_drv->name) {
2233 		pr_debug("%s ->name must be specified\n", modname);
2234 		return -EINVAL;
2235 	}
2236 
2237 	if (!cxl_drv->id) {
2238 		pr_debug("%s ->id must be specified\n", modname);
2239 		return -EINVAL;
2240 	}
2241 
2242 	cxl_drv->drv.bus = &cxl_bus_type;
2243 	cxl_drv->drv.owner = owner;
2244 	cxl_drv->drv.mod_name = modname;
2245 	cxl_drv->drv.name = cxl_drv->name;
2246 
2247 	return driver_register(&cxl_drv->drv);
2248 }
2249 EXPORT_SYMBOL_NS_GPL(__cxl_driver_register, "CXL");
2250 
2251 void cxl_driver_unregister(struct cxl_driver *cxl_drv)
2252 {
2253 	driver_unregister(&cxl_drv->drv);
2254 }
2255 EXPORT_SYMBOL_NS_GPL(cxl_driver_unregister, "CXL");
2256 
2257 static int cxl_bus_uevent(const struct device *dev, struct kobj_uevent_env *env)
2258 {
2259 	return add_uevent_var(env, "MODALIAS=" CXL_MODALIAS_FMT,
2260 			      cxl_device_id(dev));
2261 }
2262 
2263 static int cxl_bus_match(struct device *dev, const struct device_driver *drv)
2264 {
2265 	return cxl_device_id(dev) == to_cxl_drv(drv)->id;
2266 }
2267 
2268 static int cxl_bus_probe(struct device *dev)
2269 {
2270 	int rc;
2271 
2272 	rc = to_cxl_drv(dev->driver)->probe(dev);
2273 	dev_dbg(dev, "probe: %d\n", rc);
2274 	return rc;
2275 }
2276 
2277 static void cxl_bus_remove(struct device *dev)
2278 {
2279 	struct cxl_driver *cxl_drv = to_cxl_drv(dev->driver);
2280 
2281 	if (cxl_drv->remove)
2282 		cxl_drv->remove(dev);
2283 }
2284 
2285 static struct workqueue_struct *cxl_bus_wq;
2286 
2287 static int cxl_rescan_attach(struct device *dev, void *data)
2288 {
2289 	int rc = device_attach(dev);
2290 
2291 	dev_vdbg(dev, "rescan: %s\n", rc ? "attach" : "detached");
2292 
2293 	return 0;
2294 }
2295 
2296 static void cxl_bus_rescan_queue(struct work_struct *w)
2297 {
2298 	bus_for_each_dev(&cxl_bus_type, NULL, NULL, cxl_rescan_attach);
2299 }
2300 
2301 void cxl_bus_rescan(void)
2302 {
2303 	static DECLARE_WORK(rescan_work, cxl_bus_rescan_queue);
2304 
2305 	queue_work(cxl_bus_wq, &rescan_work);
2306 }
2307 EXPORT_SYMBOL_NS_GPL(cxl_bus_rescan, "CXL");
2308 
2309 void cxl_bus_drain(void)
2310 {
2311 	drain_workqueue(cxl_bus_wq);
2312 }
2313 EXPORT_SYMBOL_NS_GPL(cxl_bus_drain, "CXL");
2314 
2315 bool schedule_cxl_memdev_detach(struct cxl_memdev *cxlmd)
2316 {
2317 	return queue_work(cxl_bus_wq, &cxlmd->detach_work);
2318 }
2319 EXPORT_SYMBOL_NS_GPL(schedule_cxl_memdev_detach, "CXL");
2320 
2321 static void add_latency(struct access_coordinate *c, long latency)
2322 {
2323 	for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2324 		c[i].write_latency += latency;
2325 		c[i].read_latency += latency;
2326 	}
2327 }
2328 
2329 static bool coordinates_valid(struct access_coordinate *c)
2330 {
2331 	for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2332 		if (c[i].read_bandwidth && c[i].write_bandwidth &&
2333 		    c[i].read_latency && c[i].write_latency)
2334 			continue;
2335 		return false;
2336 	}
2337 
2338 	return true;
2339 }
2340 
2341 static void set_min_bandwidth(struct access_coordinate *c, unsigned int bw)
2342 {
2343 	for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2344 		c[i].write_bandwidth = min(c[i].write_bandwidth, bw);
2345 		c[i].read_bandwidth = min(c[i].read_bandwidth, bw);
2346 	}
2347 }
2348 
2349 static void set_access_coordinates(struct access_coordinate *out,
2350 				   struct access_coordinate *in)
2351 {
2352 	for (int i = 0; i < ACCESS_COORDINATE_MAX; i++)
2353 		out[i] = in[i];
2354 }
2355 
2356 static bool parent_port_is_cxl_root(struct cxl_port *port)
2357 {
2358 	return is_cxl_root(to_cxl_port(port->dev.parent));
2359 }
2360 
2361 /**
2362  * cxl_endpoint_get_perf_coordinates - Retrieve performance numbers stored in dports
2363  *				   of CXL path
2364  * @port: endpoint cxl_port
2365  * @coord: output performance data
2366  *
2367  * Return: errno on failure, 0 on success.
2368  */
2369 int cxl_endpoint_get_perf_coordinates(struct cxl_port *port,
2370 				      struct access_coordinate *coord)
2371 {
2372 	struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
2373 	struct access_coordinate c[] = {
2374 		{
2375 			.read_bandwidth = UINT_MAX,
2376 			.write_bandwidth = UINT_MAX,
2377 		},
2378 		{
2379 			.read_bandwidth = UINT_MAX,
2380 			.write_bandwidth = UINT_MAX,
2381 		},
2382 	};
2383 	struct cxl_port *iter = port;
2384 	struct cxl_dport *dport;
2385 	struct pci_dev *pdev;
2386 	struct device *dev;
2387 	unsigned int bw;
2388 	bool is_cxl_root;
2389 
2390 	if (!is_cxl_endpoint(port))
2391 		return -EINVAL;
2392 
2393 	/*
2394 	 * Skip calculation for RCD. Expectation is HMAT already covers RCD case
2395 	 * since RCH does not support hotplug.
2396 	 */
2397 	if (cxlmd->cxlds->rcd)
2398 		return 0;
2399 
2400 	/*
2401 	 * Exit the loop when the parent port of the current iter port is cxl
2402 	 * root. The iterative loop starts at the endpoint and gathers the
2403 	 * latency of the CXL link from the current device/port to the connected
2404 	 * downstream port each iteration.
2405 	 */
2406 	do {
2407 		dport = iter->parent_dport;
2408 		iter = to_cxl_port(iter->dev.parent);
2409 		is_cxl_root = parent_port_is_cxl_root(iter);
2410 
2411 		/*
2412 		 * There's no valid access_coordinate for a root port since RPs do not
2413 		 * have CDAT and therefore needs to be skipped.
2414 		 */
2415 		if (!is_cxl_root) {
2416 			if (!coordinates_valid(dport->coord))
2417 				return -EINVAL;
2418 			cxl_coordinates_combine(c, c, dport->coord);
2419 		}
2420 		add_latency(c, dport->link_latency);
2421 	} while (!is_cxl_root);
2422 
2423 	dport = iter->parent_dport;
2424 	/* Retrieve HB coords */
2425 	if (!coordinates_valid(dport->coord))
2426 		return -EINVAL;
2427 	cxl_coordinates_combine(c, c, dport->coord);
2428 
2429 	dev = port->uport_dev->parent;
2430 	if (!dev_is_pci(dev))
2431 		return -ENODEV;
2432 
2433 	/* Get the calculated PCI paths bandwidth */
2434 	pdev = to_pci_dev(dev);
2435 	bw = pcie_bandwidth_available(pdev, NULL, NULL, NULL);
2436 	if (bw == 0)
2437 		return -ENXIO;
2438 	bw /= BITS_PER_BYTE;
2439 
2440 	set_min_bandwidth(c, bw);
2441 	set_access_coordinates(coord, c);
2442 
2443 	return 0;
2444 }
2445 EXPORT_SYMBOL_NS_GPL(cxl_endpoint_get_perf_coordinates, "CXL");
2446 
2447 int cxl_port_get_switch_dport_bandwidth(struct cxl_port *port,
2448 					struct access_coordinate *c)
2449 {
2450 	struct cxl_dport *dport = port->parent_dport;
2451 
2452 	/* Check this port is connected to a switch DSP and not an RP */
2453 	if (parent_port_is_cxl_root(to_cxl_port(port->dev.parent)))
2454 		return -ENODEV;
2455 
2456 	if (!coordinates_valid(dport->coord))
2457 		return -EINVAL;
2458 
2459 	for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2460 		c[i].read_bandwidth = dport->coord[i].read_bandwidth;
2461 		c[i].write_bandwidth = dport->coord[i].write_bandwidth;
2462 	}
2463 
2464 	return 0;
2465 }
2466 
2467 /* for user tooling to ensure port disable work has completed */
2468 static ssize_t flush_store(const struct bus_type *bus, const char *buf, size_t count)
2469 {
2470 	if (sysfs_streq(buf, "1")) {
2471 		flush_workqueue(cxl_bus_wq);
2472 		return count;
2473 	}
2474 
2475 	return -EINVAL;
2476 }
2477 
2478 static BUS_ATTR_WO(flush);
2479 
2480 static struct attribute *cxl_bus_attributes[] = {
2481 	&bus_attr_flush.attr,
2482 	NULL,
2483 };
2484 
2485 static struct attribute_group cxl_bus_attribute_group = {
2486 	.attrs = cxl_bus_attributes,
2487 };
2488 
2489 static const struct attribute_group *cxl_bus_attribute_groups[] = {
2490 	&cxl_bus_attribute_group,
2491 	NULL,
2492 };
2493 
2494 const struct bus_type cxl_bus_type = {
2495 	.name = "cxl",
2496 	.uevent = cxl_bus_uevent,
2497 	.match = cxl_bus_match,
2498 	.probe = cxl_bus_probe,
2499 	.remove = cxl_bus_remove,
2500 	.bus_groups = cxl_bus_attribute_groups,
2501 };
2502 EXPORT_SYMBOL_NS_GPL(cxl_bus_type, "CXL");
2503 
2504 static struct dentry *cxl_debugfs;
2505 
2506 struct dentry *cxl_debugfs_create_dir(const char *dir)
2507 {
2508 	return debugfs_create_dir(dir, cxl_debugfs);
2509 }
2510 EXPORT_SYMBOL_NS_GPL(cxl_debugfs_create_dir, "CXL");
2511 
2512 static __init int cxl_core_init(void)
2513 {
2514 	int rc;
2515 
2516 	cxl_debugfs = debugfs_create_dir("cxl", NULL);
2517 
2518 	if (einj_cxl_is_initialized())
2519 		debugfs_create_file("einj_types", 0400, cxl_debugfs, NULL,
2520 				    &einj_cxl_available_error_type_fops);
2521 
2522 	cxl_mbox_init();
2523 
2524 	rc = cxl_memdev_init();
2525 	if (rc)
2526 		return rc;
2527 
2528 	cxl_bus_wq = alloc_ordered_workqueue("cxl_port", 0);
2529 	if (!cxl_bus_wq) {
2530 		rc = -ENOMEM;
2531 		goto err_wq;
2532 	}
2533 
2534 	rc = bus_register(&cxl_bus_type);
2535 	if (rc)
2536 		goto err_bus;
2537 
2538 	rc = cxl_region_init();
2539 	if (rc)
2540 		goto err_region;
2541 
2542 	rc = cxl_ras_init();
2543 	if (rc)
2544 		goto err_ras;
2545 
2546 	return 0;
2547 
2548 err_ras:
2549 	cxl_region_exit();
2550 err_region:
2551 	bus_unregister(&cxl_bus_type);
2552 err_bus:
2553 	destroy_workqueue(cxl_bus_wq);
2554 err_wq:
2555 	cxl_memdev_exit();
2556 	return rc;
2557 }
2558 
2559 static void cxl_core_exit(void)
2560 {
2561 	cxl_ras_exit();
2562 	cxl_region_exit();
2563 	bus_unregister(&cxl_bus_type);
2564 	destroy_workqueue(cxl_bus_wq);
2565 	cxl_memdev_exit();
2566 	debugfs_remove_recursive(cxl_debugfs);
2567 }
2568 
2569 subsys_initcall(cxl_core_init);
2570 module_exit(cxl_core_exit);
2571 MODULE_DESCRIPTION("CXL: Core Compute Express Link support");
2572 MODULE_LICENSE("GPL v2");
2573 MODULE_IMPORT_NS("CXL");
2574