Linux kernel mirror (for testing)
git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel
os
linux
1// SPDX-License-Identifier: GPL-2.0-only
2/* Copyright(c) 2020 Intel Corporation. All rights reserved. */
3#include <linux/platform_device.h>
4#include <linux/memregion.h>
5#include <linux/workqueue.h>
6#include <linux/debugfs.h>
7#include <linux/device.h>
8#include <linux/module.h>
9#include <linux/pci.h>
10#include <linux/slab.h>
11#include <linux/idr.h>
12#include <linux/node.h>
13#include <cxl/einj.h>
14#include <cxlmem.h>
15#include <cxlpci.h>
16#include <cxl.h>
17#include "core.h"
18
19/**
20 * DOC: cxl core
21 *
22 * The CXL core provides a set of interfaces that can be consumed by CXL aware
23 * drivers. The interfaces allow for creation, modification, and destruction of
24 * regions, memory devices, ports, and decoders. CXL aware drivers must register
25 * with the CXL core via these interfaces in order to be able to participate in
26 * cross-device interleave coordination. The CXL core also establishes and
27 * maintains the bridge to the nvdimm subsystem.
28 *
29 * CXL core introduces sysfs hierarchy to control the devices that are
30 * instantiated by the core.
31 */
32
33static DEFINE_IDA(cxl_port_ida);
34static DEFINE_XARRAY(cxl_root_buses);
35
36int cxl_num_decoders_committed(struct cxl_port *port)
37{
38 lockdep_assert_held(&cxl_rwsem.region);
39
40 return port->commit_end + 1;
41}
42
43static ssize_t devtype_show(struct device *dev, struct device_attribute *attr,
44 char *buf)
45{
46 return sysfs_emit(buf, "%s\n", dev->type->name);
47}
48static DEVICE_ATTR_RO(devtype);
49
50static int cxl_device_id(const struct device *dev)
51{
52 if (dev->type == &cxl_nvdimm_bridge_type)
53 return CXL_DEVICE_NVDIMM_BRIDGE;
54 if (dev->type == &cxl_nvdimm_type)
55 return CXL_DEVICE_NVDIMM;
56 if (dev->type == CXL_PMEM_REGION_TYPE())
57 return CXL_DEVICE_PMEM_REGION;
58 if (dev->type == CXL_DAX_REGION_TYPE())
59 return CXL_DEVICE_DAX_REGION;
60 if (is_cxl_port(dev)) {
61 if (is_cxl_root(to_cxl_port(dev)))
62 return CXL_DEVICE_ROOT;
63 return CXL_DEVICE_PORT;
64 }
65 if (is_cxl_memdev(dev))
66 return CXL_DEVICE_MEMORY_EXPANDER;
67 if (dev->type == CXL_REGION_TYPE())
68 return CXL_DEVICE_REGION;
69 if (dev->type == &cxl_pmu_type)
70 return CXL_DEVICE_PMU;
71 return 0;
72}
73
74static ssize_t modalias_show(struct device *dev, struct device_attribute *attr,
75 char *buf)
76{
77 return sysfs_emit(buf, CXL_MODALIAS_FMT "\n", cxl_device_id(dev));
78}
79static DEVICE_ATTR_RO(modalias);
80
81static struct attribute *cxl_base_attributes[] = {
82 &dev_attr_devtype.attr,
83 &dev_attr_modalias.attr,
84 NULL,
85};
86
87struct attribute_group cxl_base_attribute_group = {
88 .attrs = cxl_base_attributes,
89};
90
91static ssize_t start_show(struct device *dev, struct device_attribute *attr,
92 char *buf)
93{
94 struct cxl_decoder *cxld = to_cxl_decoder(dev);
95
96 return sysfs_emit(buf, "%#llx\n", cxld->hpa_range.start);
97}
98static DEVICE_ATTR_ADMIN_RO(start);
99
100static ssize_t size_show(struct device *dev, struct device_attribute *attr,
101 char *buf)
102{
103 struct cxl_decoder *cxld = to_cxl_decoder(dev);
104
105 return sysfs_emit(buf, "%#llx\n", range_len(&cxld->hpa_range));
106}
107static DEVICE_ATTR_RO(size);
108
109#define CXL_DECODER_FLAG_ATTR(name, flag) \
110static ssize_t name##_show(struct device *dev, \
111 struct device_attribute *attr, char *buf) \
112{ \
113 struct cxl_decoder *cxld = to_cxl_decoder(dev); \
114 \
115 return sysfs_emit(buf, "%s\n", \
116 (cxld->flags & (flag)) ? "1" : "0"); \
117} \
118static DEVICE_ATTR_RO(name)
119
120CXL_DECODER_FLAG_ATTR(cap_pmem, CXL_DECODER_F_PMEM);
121CXL_DECODER_FLAG_ATTR(cap_ram, CXL_DECODER_F_RAM);
122CXL_DECODER_FLAG_ATTR(cap_type2, CXL_DECODER_F_TYPE2);
123CXL_DECODER_FLAG_ATTR(cap_type3, CXL_DECODER_F_TYPE3);
124CXL_DECODER_FLAG_ATTR(locked, CXL_DECODER_F_LOCK);
125
126static ssize_t target_type_show(struct device *dev,
127 struct device_attribute *attr, char *buf)
128{
129 struct cxl_decoder *cxld = to_cxl_decoder(dev);
130
131 switch (cxld->target_type) {
132 case CXL_DECODER_DEVMEM:
133 return sysfs_emit(buf, "accelerator\n");
134 case CXL_DECODER_HOSTONLYMEM:
135 return sysfs_emit(buf, "expander\n");
136 }
137 return -ENXIO;
138}
139static DEVICE_ATTR_RO(target_type);
140
141static ssize_t emit_target_list(struct cxl_switch_decoder *cxlsd, char *buf)
142{
143 struct cxl_decoder *cxld = &cxlsd->cxld;
144 ssize_t offset = 0;
145 int i, rc = 0;
146
147 for (i = 0; i < cxld->interleave_ways; i++) {
148 struct cxl_dport *dport = cxlsd->target[i];
149 struct cxl_dport *next = NULL;
150
151 if (!dport)
152 break;
153
154 if (i + 1 < cxld->interleave_ways)
155 next = cxlsd->target[i + 1];
156 rc = sysfs_emit_at(buf, offset, "%d%s", dport->port_id,
157 next ? "," : "");
158 if (rc < 0)
159 return rc;
160 offset += rc;
161 }
162
163 return offset;
164}
165
166static ssize_t target_list_show(struct device *dev,
167 struct device_attribute *attr, char *buf)
168{
169 struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
170 ssize_t offset;
171 int rc;
172
173 guard(rwsem_read)(&cxl_rwsem.region);
174 rc = emit_target_list(cxlsd, buf);
175 if (rc < 0)
176 return rc;
177 offset = rc;
178
179 rc = sysfs_emit_at(buf, offset, "\n");
180 if (rc < 0)
181 return rc;
182
183 return offset + rc;
184}
185static DEVICE_ATTR_RO(target_list);
186
187static ssize_t mode_show(struct device *dev, struct device_attribute *attr,
188 char *buf)
189{
190 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
191 struct cxl_memdev *cxlmd = cxled_to_memdev(cxled);
192 struct cxl_dev_state *cxlds = cxlmd->cxlds;
193 /* without @cxl_rwsem.dpa, make sure @part is not reloaded */
194 int part = READ_ONCE(cxled->part);
195 const char *desc;
196
197 if (part < 0)
198 desc = "none";
199 else
200 desc = cxlds->part[part].res.name;
201
202 return sysfs_emit(buf, "%s\n", desc);
203}
204
205static ssize_t mode_store(struct device *dev, struct device_attribute *attr,
206 const char *buf, size_t len)
207{
208 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
209 enum cxl_partition_mode mode;
210 ssize_t rc;
211
212 if (sysfs_streq(buf, "pmem"))
213 mode = CXL_PARTMODE_PMEM;
214 else if (sysfs_streq(buf, "ram"))
215 mode = CXL_PARTMODE_RAM;
216 else
217 return -EINVAL;
218
219 rc = cxl_dpa_set_part(cxled, mode);
220 if (rc)
221 return rc;
222
223 return len;
224}
225static DEVICE_ATTR_RW(mode);
226
227static ssize_t dpa_resource_show(struct device *dev, struct device_attribute *attr,
228 char *buf)
229{
230 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
231
232 guard(rwsem_read)(&cxl_rwsem.dpa);
233 return sysfs_emit(buf, "%#llx\n", (u64)cxl_dpa_resource_start(cxled));
234}
235static DEVICE_ATTR_RO(dpa_resource);
236
237static ssize_t dpa_size_show(struct device *dev, struct device_attribute *attr,
238 char *buf)
239{
240 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
241 resource_size_t size = cxl_dpa_size(cxled);
242
243 return sysfs_emit(buf, "%pa\n", &size);
244}
245
246static ssize_t dpa_size_store(struct device *dev, struct device_attribute *attr,
247 const char *buf, size_t len)
248{
249 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
250 unsigned long long size;
251 ssize_t rc;
252
253 rc = kstrtoull(buf, 0, &size);
254 if (rc)
255 return rc;
256
257 if (!IS_ALIGNED(size, SZ_256M))
258 return -EINVAL;
259
260 rc = cxl_dpa_free(cxled);
261 if (rc)
262 return rc;
263
264 if (size == 0)
265 return len;
266
267 rc = cxl_dpa_alloc(cxled, size);
268 if (rc)
269 return rc;
270
271 return len;
272}
273static DEVICE_ATTR_RW(dpa_size);
274
275static ssize_t interleave_granularity_show(struct device *dev,
276 struct device_attribute *attr,
277 char *buf)
278{
279 struct cxl_decoder *cxld = to_cxl_decoder(dev);
280
281 return sysfs_emit(buf, "%d\n", cxld->interleave_granularity);
282}
283
284static DEVICE_ATTR_RO(interleave_granularity);
285
286static ssize_t interleave_ways_show(struct device *dev,
287 struct device_attribute *attr, char *buf)
288{
289 struct cxl_decoder *cxld = to_cxl_decoder(dev);
290
291 return sysfs_emit(buf, "%d\n", cxld->interleave_ways);
292}
293
294static DEVICE_ATTR_RO(interleave_ways);
295
296static ssize_t qos_class_show(struct device *dev,
297 struct device_attribute *attr, char *buf)
298{
299 struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
300
301 return sysfs_emit(buf, "%d\n", cxlrd->qos_class);
302}
303static DEVICE_ATTR_RO(qos_class);
304
305static struct attribute *cxl_decoder_base_attrs[] = {
306 &dev_attr_start.attr,
307 &dev_attr_size.attr,
308 &dev_attr_locked.attr,
309 &dev_attr_interleave_granularity.attr,
310 &dev_attr_interleave_ways.attr,
311 NULL,
312};
313
314static struct attribute_group cxl_decoder_base_attribute_group = {
315 .attrs = cxl_decoder_base_attrs,
316};
317
318static struct attribute *cxl_decoder_root_attrs[] = {
319 &dev_attr_cap_pmem.attr,
320 &dev_attr_cap_ram.attr,
321 &dev_attr_cap_type2.attr,
322 &dev_attr_cap_type3.attr,
323 &dev_attr_target_list.attr,
324 &dev_attr_qos_class.attr,
325 SET_CXL_REGION_ATTR(create_pmem_region)
326 SET_CXL_REGION_ATTR(create_ram_region)
327 SET_CXL_REGION_ATTR(delete_region)
328 NULL,
329};
330
331static bool can_create_pmem(struct cxl_root_decoder *cxlrd)
332{
333 unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_PMEM;
334
335 return (cxlrd->cxlsd.cxld.flags & flags) == flags;
336}
337
338static bool can_create_ram(struct cxl_root_decoder *cxlrd)
339{
340 unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_RAM;
341
342 return (cxlrd->cxlsd.cxld.flags & flags) == flags;
343}
344
345static umode_t cxl_root_decoder_visible(struct kobject *kobj, struct attribute *a, int n)
346{
347 struct device *dev = kobj_to_dev(kobj);
348 struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
349
350 if (a == CXL_REGION_ATTR(create_pmem_region) && !can_create_pmem(cxlrd))
351 return 0;
352
353 if (a == CXL_REGION_ATTR(create_ram_region) && !can_create_ram(cxlrd))
354 return 0;
355
356 if (a == CXL_REGION_ATTR(delete_region) &&
357 !(can_create_pmem(cxlrd) || can_create_ram(cxlrd)))
358 return 0;
359
360 return a->mode;
361}
362
363static struct attribute_group cxl_decoder_root_attribute_group = {
364 .attrs = cxl_decoder_root_attrs,
365 .is_visible = cxl_root_decoder_visible,
366};
367
368static const struct attribute_group *cxl_decoder_root_attribute_groups[] = {
369 &cxl_decoder_root_attribute_group,
370 &cxl_decoder_base_attribute_group,
371 &cxl_base_attribute_group,
372 NULL,
373};
374
375static struct attribute *cxl_decoder_switch_attrs[] = {
376 &dev_attr_target_type.attr,
377 &dev_attr_target_list.attr,
378 SET_CXL_REGION_ATTR(region)
379 NULL,
380};
381
382static struct attribute_group cxl_decoder_switch_attribute_group = {
383 .attrs = cxl_decoder_switch_attrs,
384};
385
386static const struct attribute_group *cxl_decoder_switch_attribute_groups[] = {
387 &cxl_decoder_switch_attribute_group,
388 &cxl_decoder_base_attribute_group,
389 &cxl_base_attribute_group,
390 NULL,
391};
392
393static struct attribute *cxl_decoder_endpoint_attrs[] = {
394 &dev_attr_target_type.attr,
395 &dev_attr_mode.attr,
396 &dev_attr_dpa_size.attr,
397 &dev_attr_dpa_resource.attr,
398 SET_CXL_REGION_ATTR(region)
399 NULL,
400};
401
402static struct attribute_group cxl_decoder_endpoint_attribute_group = {
403 .attrs = cxl_decoder_endpoint_attrs,
404};
405
406static const struct attribute_group *cxl_decoder_endpoint_attribute_groups[] = {
407 &cxl_decoder_base_attribute_group,
408 &cxl_decoder_endpoint_attribute_group,
409 &cxl_base_attribute_group,
410 NULL,
411};
412
413static void __cxl_decoder_release(struct cxl_decoder *cxld)
414{
415 struct cxl_port *port = to_cxl_port(cxld->dev.parent);
416
417 ida_free(&port->decoder_ida, cxld->id);
418 put_device(&port->dev);
419}
420
421static void cxl_endpoint_decoder_release(struct device *dev)
422{
423 struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
424
425 __cxl_decoder_release(&cxled->cxld);
426 kfree(cxled);
427}
428
429static void cxl_switch_decoder_release(struct device *dev)
430{
431 struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
432
433 __cxl_decoder_release(&cxlsd->cxld);
434 kfree(cxlsd);
435}
436
437struct cxl_root_decoder *to_cxl_root_decoder(struct device *dev)
438{
439 if (dev_WARN_ONCE(dev, !is_root_decoder(dev),
440 "not a cxl_root_decoder device\n"))
441 return NULL;
442 return container_of(dev, struct cxl_root_decoder, cxlsd.cxld.dev);
443}
444EXPORT_SYMBOL_NS_GPL(to_cxl_root_decoder, "CXL");
445
446static void cxl_root_decoder_release(struct device *dev)
447{
448 struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
449
450 if (atomic_read(&cxlrd->region_id) >= 0)
451 memregion_free(atomic_read(&cxlrd->region_id));
452 __cxl_decoder_release(&cxlrd->cxlsd.cxld);
453 kfree(cxlrd);
454}
455
456static const struct device_type cxl_decoder_endpoint_type = {
457 .name = "cxl_decoder_endpoint",
458 .release = cxl_endpoint_decoder_release,
459 .groups = cxl_decoder_endpoint_attribute_groups,
460};
461
462static const struct device_type cxl_decoder_switch_type = {
463 .name = "cxl_decoder_switch",
464 .release = cxl_switch_decoder_release,
465 .groups = cxl_decoder_switch_attribute_groups,
466};
467
468static const struct device_type cxl_decoder_root_type = {
469 .name = "cxl_decoder_root",
470 .release = cxl_root_decoder_release,
471 .groups = cxl_decoder_root_attribute_groups,
472};
473
474bool is_endpoint_decoder(struct device *dev)
475{
476 return dev->type == &cxl_decoder_endpoint_type;
477}
478EXPORT_SYMBOL_NS_GPL(is_endpoint_decoder, "CXL");
479
480bool is_root_decoder(struct device *dev)
481{
482 return dev->type == &cxl_decoder_root_type;
483}
484EXPORT_SYMBOL_NS_GPL(is_root_decoder, "CXL");
485
486bool is_switch_decoder(struct device *dev)
487{
488 return is_root_decoder(dev) || dev->type == &cxl_decoder_switch_type;
489}
490EXPORT_SYMBOL_NS_GPL(is_switch_decoder, "CXL");
491
492struct cxl_decoder *to_cxl_decoder(struct device *dev)
493{
494 if (dev_WARN_ONCE(dev,
495 !is_switch_decoder(dev) && !is_endpoint_decoder(dev),
496 "not a cxl_decoder device\n"))
497 return NULL;
498 return container_of(dev, struct cxl_decoder, dev);
499}
500EXPORT_SYMBOL_NS_GPL(to_cxl_decoder, "CXL");
501
502struct cxl_endpoint_decoder *to_cxl_endpoint_decoder(struct device *dev)
503{
504 if (dev_WARN_ONCE(dev, !is_endpoint_decoder(dev),
505 "not a cxl_endpoint_decoder device\n"))
506 return NULL;
507 return container_of(dev, struct cxl_endpoint_decoder, cxld.dev);
508}
509EXPORT_SYMBOL_NS_GPL(to_cxl_endpoint_decoder, "CXL");
510
511struct cxl_switch_decoder *to_cxl_switch_decoder(struct device *dev)
512{
513 if (dev_WARN_ONCE(dev, !is_switch_decoder(dev),
514 "not a cxl_switch_decoder device\n"))
515 return NULL;
516 return container_of(dev, struct cxl_switch_decoder, cxld.dev);
517}
518EXPORT_SYMBOL_NS_GPL(to_cxl_switch_decoder, "CXL");
519
520static void cxl_ep_release(struct cxl_ep *ep)
521{
522 put_device(ep->ep);
523 kfree(ep);
524}
525
526static void cxl_ep_remove(struct cxl_port *port, struct cxl_ep *ep)
527{
528 if (!ep)
529 return;
530 xa_erase(&port->endpoints, (unsigned long) ep->ep);
531 cxl_ep_release(ep);
532}
533
534static void cxl_port_release(struct device *dev)
535{
536 struct cxl_port *port = to_cxl_port(dev);
537 unsigned long index;
538 struct cxl_ep *ep;
539
540 xa_for_each(&port->endpoints, index, ep)
541 cxl_ep_remove(port, ep);
542 xa_destroy(&port->endpoints);
543 xa_destroy(&port->dports);
544 xa_destroy(&port->regions);
545 ida_free(&cxl_port_ida, port->id);
546 if (is_cxl_root(port))
547 kfree(to_cxl_root(port));
548 else
549 kfree(port);
550}
551
552static ssize_t decoders_committed_show(struct device *dev,
553 struct device_attribute *attr, char *buf)
554{
555 struct cxl_port *port = to_cxl_port(dev);
556
557 guard(rwsem_read)(&cxl_rwsem.region);
558 return sysfs_emit(buf, "%d\n", cxl_num_decoders_committed(port));
559}
560
561static DEVICE_ATTR_RO(decoders_committed);
562
563static struct attribute *cxl_port_attrs[] = {
564 &dev_attr_decoders_committed.attr,
565 NULL,
566};
567
568static struct attribute_group cxl_port_attribute_group = {
569 .attrs = cxl_port_attrs,
570};
571
572static const struct attribute_group *cxl_port_attribute_groups[] = {
573 &cxl_base_attribute_group,
574 &cxl_port_attribute_group,
575 NULL,
576};
577
578static const struct device_type cxl_port_type = {
579 .name = "cxl_port",
580 .release = cxl_port_release,
581 .groups = cxl_port_attribute_groups,
582};
583
584bool is_cxl_port(const struct device *dev)
585{
586 return dev->type == &cxl_port_type;
587}
588EXPORT_SYMBOL_NS_GPL(is_cxl_port, "CXL");
589
590struct cxl_port *to_cxl_port(const struct device *dev)
591{
592 if (dev_WARN_ONCE(dev, dev->type != &cxl_port_type,
593 "not a cxl_port device\n"))
594 return NULL;
595 return container_of(dev, struct cxl_port, dev);
596}
597EXPORT_SYMBOL_NS_GPL(to_cxl_port, "CXL");
598
599struct cxl_port *parent_port_of(struct cxl_port *port)
600{
601 if (!port || !port->parent_dport)
602 return NULL;
603 return port->parent_dport->port;
604}
605
606static void unregister_port(void *_port)
607{
608 struct cxl_port *port = _port;
609 struct cxl_port *parent = parent_port_of(port);
610 struct device *lock_dev;
611
612 /*
613 * CXL root port's and the first level of ports are unregistered
614 * under the platform firmware device lock, all other ports are
615 * unregistered while holding their parent port lock.
616 */
617 if (!parent)
618 lock_dev = port->uport_dev;
619 else if (is_cxl_root(parent))
620 lock_dev = parent->uport_dev;
621 else
622 lock_dev = &parent->dev;
623
624 device_lock_assert(lock_dev);
625 port->dead = true;
626 device_unregister(&port->dev);
627}
628
629static void cxl_unlink_uport(void *_port)
630{
631 struct cxl_port *port = _port;
632
633 sysfs_remove_link(&port->dev.kobj, "uport");
634}
635
636static int devm_cxl_link_uport(struct device *host, struct cxl_port *port)
637{
638 int rc;
639
640 rc = sysfs_create_link(&port->dev.kobj, &port->uport_dev->kobj,
641 "uport");
642 if (rc)
643 return rc;
644 return devm_add_action_or_reset(host, cxl_unlink_uport, port);
645}
646
647static void cxl_unlink_parent_dport(void *_port)
648{
649 struct cxl_port *port = _port;
650
651 sysfs_remove_link(&port->dev.kobj, "parent_dport");
652}
653
654static int devm_cxl_link_parent_dport(struct device *host,
655 struct cxl_port *port,
656 struct cxl_dport *parent_dport)
657{
658 int rc;
659
660 if (!parent_dport)
661 return 0;
662
663 rc = sysfs_create_link(&port->dev.kobj, &parent_dport->dport_dev->kobj,
664 "parent_dport");
665 if (rc)
666 return rc;
667 return devm_add_action_or_reset(host, cxl_unlink_parent_dport, port);
668}
669
670static struct lock_class_key cxl_port_key;
671
672static struct cxl_port *cxl_port_alloc(struct device *uport_dev,
673 struct cxl_dport *parent_dport)
674{
675 struct cxl_root *cxl_root __free(kfree) = NULL;
676 struct cxl_port *port, *_port __free(kfree) = NULL;
677 struct device *dev;
678 int rc;
679
680 /* No parent_dport, root cxl_port */
681 if (!parent_dport) {
682 cxl_root = kzalloc(sizeof(*cxl_root), GFP_KERNEL);
683 if (!cxl_root)
684 return ERR_PTR(-ENOMEM);
685 } else {
686 _port = kzalloc(sizeof(*port), GFP_KERNEL);
687 if (!_port)
688 return ERR_PTR(-ENOMEM);
689 }
690
691 rc = ida_alloc(&cxl_port_ida, GFP_KERNEL);
692 if (rc < 0)
693 return ERR_PTR(rc);
694
695 if (cxl_root)
696 port = &no_free_ptr(cxl_root)->port;
697 else
698 port = no_free_ptr(_port);
699
700 port->id = rc;
701 port->uport_dev = uport_dev;
702
703 /*
704 * The top-level cxl_port "cxl_root" does not have a cxl_port as
705 * its parent and it does not have any corresponding component
706 * registers as its decode is described by a fixed platform
707 * description.
708 */
709 dev = &port->dev;
710 if (parent_dport) {
711 struct cxl_port *parent_port = parent_dport->port;
712 struct cxl_port *iter;
713
714 dev->parent = &parent_port->dev;
715 port->depth = parent_port->depth + 1;
716 port->parent_dport = parent_dport;
717
718 /*
719 * walk to the host bridge, or the first ancestor that knows
720 * the host bridge
721 */
722 iter = port;
723 while (!iter->host_bridge &&
724 !is_cxl_root(to_cxl_port(iter->dev.parent)))
725 iter = to_cxl_port(iter->dev.parent);
726 if (iter->host_bridge)
727 port->host_bridge = iter->host_bridge;
728 else if (parent_dport->rch)
729 port->host_bridge = parent_dport->dport_dev;
730 else
731 port->host_bridge = iter->uport_dev;
732 dev_dbg(uport_dev, "host-bridge: %s\n",
733 dev_name(port->host_bridge));
734 } else
735 dev->parent = uport_dev;
736
737 ida_init(&port->decoder_ida);
738 port->hdm_end = -1;
739 port->commit_end = -1;
740 xa_init(&port->dports);
741 xa_init(&port->endpoints);
742 xa_init(&port->regions);
743
744 device_initialize(dev);
745 lockdep_set_class_and_subclass(&dev->mutex, &cxl_port_key, port->depth);
746 device_set_pm_not_required(dev);
747 dev->bus = &cxl_bus_type;
748 dev->type = &cxl_port_type;
749
750 return port;
751}
752
753static int cxl_setup_comp_regs(struct device *host, struct cxl_register_map *map,
754 resource_size_t component_reg_phys)
755{
756 *map = (struct cxl_register_map) {
757 .host = host,
758 .reg_type = CXL_REGLOC_RBI_EMPTY,
759 .resource = component_reg_phys,
760 };
761
762 if (component_reg_phys == CXL_RESOURCE_NONE)
763 return 0;
764
765 map->reg_type = CXL_REGLOC_RBI_COMPONENT;
766 map->max_size = CXL_COMPONENT_REG_BLOCK_SIZE;
767
768 return cxl_setup_regs(map);
769}
770
771static int cxl_port_setup_regs(struct cxl_port *port,
772 resource_size_t component_reg_phys)
773{
774 if (dev_is_platform(port->uport_dev))
775 return 0;
776 return cxl_setup_comp_regs(&port->dev, &port->reg_map,
777 component_reg_phys);
778}
779
780static int cxl_dport_setup_regs(struct device *host, struct cxl_dport *dport,
781 resource_size_t component_reg_phys)
782{
783 int rc;
784
785 if (dev_is_platform(dport->dport_dev))
786 return 0;
787
788 /*
789 * use @dport->dport_dev for the context for error messages during
790 * register probing, and fixup @host after the fact, since @host may be
791 * NULL.
792 */
793 rc = cxl_setup_comp_regs(dport->dport_dev, &dport->reg_map,
794 component_reg_phys);
795 dport->reg_map.host = host;
796 return rc;
797}
798
799DEFINE_SHOW_ATTRIBUTE(einj_cxl_available_error_type);
800
801static int cxl_einj_inject(void *data, u64 type)
802{
803 struct cxl_dport *dport = data;
804
805 if (dport->rch)
806 return einj_cxl_inject_rch_error(dport->rcrb.base, type);
807
808 return einj_cxl_inject_error(to_pci_dev(dport->dport_dev), type);
809}
810DEFINE_DEBUGFS_ATTRIBUTE(cxl_einj_inject_fops, NULL, cxl_einj_inject,
811 "0x%llx\n");
812
813static void cxl_debugfs_create_dport_dir(struct cxl_dport *dport)
814{
815 struct dentry *dir;
816
817 if (!einj_cxl_is_initialized())
818 return;
819
820 /*
821 * dport_dev needs to be a PCIe port for CXL 2.0+ ports because
822 * EINJ expects a dport SBDF to be specified for 2.0 error injection.
823 */
824 if (!dport->rch && !dev_is_pci(dport->dport_dev))
825 return;
826
827 dir = cxl_debugfs_create_dir(dev_name(dport->dport_dev));
828
829 debugfs_create_file("einj_inject", 0200, dir, dport,
830 &cxl_einj_inject_fops);
831}
832
833static int cxl_port_add(struct cxl_port *port,
834 resource_size_t component_reg_phys,
835 struct cxl_dport *parent_dport)
836{
837 struct device *dev __free(put_device) = &port->dev;
838 int rc;
839
840 if (is_cxl_memdev(port->uport_dev)) {
841 struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
842 struct cxl_dev_state *cxlds = cxlmd->cxlds;
843
844 rc = dev_set_name(dev, "endpoint%d", port->id);
845 if (rc)
846 return rc;
847
848 /*
849 * The endpoint driver already enumerated the component and RAS
850 * registers. Reuse that enumeration while prepping them to be
851 * mapped by the cxl_port driver.
852 */
853 port->reg_map = cxlds->reg_map;
854 port->reg_map.host = &port->dev;
855 cxlmd->endpoint = port;
856 } else if (parent_dport) {
857 rc = dev_set_name(dev, "port%d", port->id);
858 if (rc)
859 return rc;
860
861 rc = cxl_port_setup_regs(port, component_reg_phys);
862 if (rc)
863 return rc;
864 } else {
865 rc = dev_set_name(dev, "root%d", port->id);
866 if (rc)
867 return rc;
868 }
869
870 rc = device_add(dev);
871 if (rc)
872 return rc;
873
874 /* Inhibit the cleanup function invoked */
875 dev = NULL;
876 return 0;
877}
878
879static struct cxl_port *__devm_cxl_add_port(struct device *host,
880 struct device *uport_dev,
881 resource_size_t component_reg_phys,
882 struct cxl_dport *parent_dport)
883{
884 struct cxl_port *port;
885 int rc;
886
887 port = cxl_port_alloc(uport_dev, parent_dport);
888 if (IS_ERR(port))
889 return port;
890
891 rc = cxl_port_add(port, component_reg_phys, parent_dport);
892 if (rc)
893 return ERR_PTR(rc);
894
895 rc = devm_add_action_or_reset(host, unregister_port, port);
896 if (rc)
897 return ERR_PTR(rc);
898
899 rc = devm_cxl_link_uport(host, port);
900 if (rc)
901 return ERR_PTR(rc);
902
903 rc = devm_cxl_link_parent_dport(host, port, parent_dport);
904 if (rc)
905 return ERR_PTR(rc);
906
907 if (parent_dport && dev_is_pci(uport_dev))
908 port->pci_latency = cxl_pci_get_latency(to_pci_dev(uport_dev));
909
910 return port;
911}
912
913/**
914 * devm_cxl_add_port - register a cxl_port in CXL memory decode hierarchy
915 * @host: host device for devm operations
916 * @uport_dev: "physical" device implementing this upstream port
917 * @component_reg_phys: (optional) for configurable cxl_port instances
918 * @parent_dport: next hop up in the CXL memory decode hierarchy
919 */
920struct cxl_port *devm_cxl_add_port(struct device *host,
921 struct device *uport_dev,
922 resource_size_t component_reg_phys,
923 struct cxl_dport *parent_dport)
924{
925 struct cxl_port *port, *parent_port;
926
927 port = __devm_cxl_add_port(host, uport_dev, component_reg_phys,
928 parent_dport);
929
930 parent_port = parent_dport ? parent_dport->port : NULL;
931 if (IS_ERR(port)) {
932 dev_dbg(uport_dev, "Failed to add%s%s%s: %ld\n",
933 parent_port ? " port to " : "",
934 parent_port ? dev_name(&parent_port->dev) : "",
935 parent_port ? "" : " root port",
936 PTR_ERR(port));
937 } else {
938 dev_dbg(uport_dev, "%s added%s%s%s\n",
939 dev_name(&port->dev),
940 parent_port ? " to " : "",
941 parent_port ? dev_name(&parent_port->dev) : "",
942 parent_port ? "" : " (root port)");
943 }
944
945 return port;
946}
947EXPORT_SYMBOL_NS_GPL(devm_cxl_add_port, "CXL");
948
949struct cxl_root *devm_cxl_add_root(struct device *host,
950 const struct cxl_root_ops *ops)
951{
952 struct cxl_root *cxl_root;
953 struct cxl_port *port;
954
955 port = devm_cxl_add_port(host, host, CXL_RESOURCE_NONE, NULL);
956 if (IS_ERR(port))
957 return ERR_CAST(port);
958
959 cxl_root = to_cxl_root(port);
960 cxl_root->ops = ops;
961 return cxl_root;
962}
963EXPORT_SYMBOL_NS_GPL(devm_cxl_add_root, "CXL");
964
965struct pci_bus *cxl_port_to_pci_bus(struct cxl_port *port)
966{
967 /* There is no pci_bus associated with a CXL platform-root port */
968 if (is_cxl_root(port))
969 return NULL;
970
971 if (dev_is_pci(port->uport_dev)) {
972 struct pci_dev *pdev = to_pci_dev(port->uport_dev);
973
974 return pdev->subordinate;
975 }
976
977 return xa_load(&cxl_root_buses, (unsigned long)port->uport_dev);
978}
979EXPORT_SYMBOL_NS_GPL(cxl_port_to_pci_bus, "CXL");
980
981static void unregister_pci_bus(void *uport_dev)
982{
983 xa_erase(&cxl_root_buses, (unsigned long)uport_dev);
984}
985
986int devm_cxl_register_pci_bus(struct device *host, struct device *uport_dev,
987 struct pci_bus *bus)
988{
989 int rc;
990
991 if (dev_is_pci(uport_dev))
992 return -EINVAL;
993
994 rc = xa_insert(&cxl_root_buses, (unsigned long)uport_dev, bus,
995 GFP_KERNEL);
996 if (rc)
997 return rc;
998 return devm_add_action_or_reset(host, unregister_pci_bus, uport_dev);
999}
1000EXPORT_SYMBOL_NS_GPL(devm_cxl_register_pci_bus, "CXL");
1001
1002static bool dev_is_cxl_root_child(struct device *dev)
1003{
1004 struct cxl_port *port, *parent;
1005
1006 if (!is_cxl_port(dev))
1007 return false;
1008
1009 port = to_cxl_port(dev);
1010 if (is_cxl_root(port))
1011 return false;
1012
1013 parent = to_cxl_port(port->dev.parent);
1014 if (is_cxl_root(parent))
1015 return true;
1016
1017 return false;
1018}
1019
1020struct cxl_root *find_cxl_root(struct cxl_port *port)
1021{
1022 struct cxl_port *iter = port;
1023
1024 while (iter && !is_cxl_root(iter))
1025 iter = to_cxl_port(iter->dev.parent);
1026
1027 if (!iter)
1028 return NULL;
1029 get_device(&iter->dev);
1030 return to_cxl_root(iter);
1031}
1032EXPORT_SYMBOL_NS_GPL(find_cxl_root, "CXL");
1033
1034static struct cxl_dport *find_dport(struct cxl_port *port, int id)
1035{
1036 struct cxl_dport *dport;
1037 unsigned long index;
1038
1039 device_lock_assert(&port->dev);
1040 xa_for_each(&port->dports, index, dport)
1041 if (dport->port_id == id)
1042 return dport;
1043 return NULL;
1044}
1045
1046static int add_dport(struct cxl_port *port, struct cxl_dport *dport)
1047{
1048 struct cxl_dport *dup;
1049 int rc;
1050
1051 device_lock_assert(&port->dev);
1052 dup = find_dport(port, dport->port_id);
1053 if (dup) {
1054 dev_err(&port->dev,
1055 "unable to add dport%d-%s non-unique port id (%s)\n",
1056 dport->port_id, dev_name(dport->dport_dev),
1057 dev_name(dup->dport_dev));
1058 return -EBUSY;
1059 }
1060
1061 rc = xa_insert(&port->dports, (unsigned long)dport->dport_dev, dport,
1062 GFP_KERNEL);
1063 if (rc)
1064 return rc;
1065
1066 port->nr_dports++;
1067 return 0;
1068}
1069
1070/*
1071 * Since root-level CXL dports cannot be enumerated by PCI they are not
1072 * enumerated by the common port driver that acquires the port lock over
1073 * dport add/remove. Instead, root dports are manually added by a
1074 * platform driver and cond_cxl_root_lock() is used to take the missing
1075 * port lock in that case.
1076 */
1077static void cond_cxl_root_lock(struct cxl_port *port)
1078{
1079 if (is_cxl_root(port))
1080 device_lock(&port->dev);
1081}
1082
1083static void cond_cxl_root_unlock(struct cxl_port *port)
1084{
1085 if (is_cxl_root(port))
1086 device_unlock(&port->dev);
1087}
1088
1089static void cxl_dport_remove(void *data)
1090{
1091 struct cxl_dport *dport = data;
1092 struct cxl_port *port = dport->port;
1093
1094 xa_erase(&port->dports, (unsigned long) dport->dport_dev);
1095 put_device(dport->dport_dev);
1096}
1097
1098static void cxl_dport_unlink(void *data)
1099{
1100 struct cxl_dport *dport = data;
1101 struct cxl_port *port = dport->port;
1102 char link_name[CXL_TARGET_STRLEN];
1103
1104 sprintf(link_name, "dport%d", dport->port_id);
1105 sysfs_remove_link(&port->dev.kobj, link_name);
1106}
1107
1108static struct cxl_dport *
1109__devm_cxl_add_dport(struct cxl_port *port, struct device *dport_dev,
1110 int port_id, resource_size_t component_reg_phys,
1111 resource_size_t rcrb)
1112{
1113 char link_name[CXL_TARGET_STRLEN];
1114 struct cxl_dport *dport;
1115 struct device *host;
1116 int rc;
1117
1118 if (is_cxl_root(port))
1119 host = port->uport_dev;
1120 else
1121 host = &port->dev;
1122
1123 if (!host->driver) {
1124 dev_WARN_ONCE(&port->dev, 1, "dport:%s bad devm context\n",
1125 dev_name(dport_dev));
1126 return ERR_PTR(-ENXIO);
1127 }
1128
1129 if (snprintf(link_name, CXL_TARGET_STRLEN, "dport%d", port_id) >=
1130 CXL_TARGET_STRLEN)
1131 return ERR_PTR(-EINVAL);
1132
1133 dport = devm_kzalloc(host, sizeof(*dport), GFP_KERNEL);
1134 if (!dport)
1135 return ERR_PTR(-ENOMEM);
1136
1137 dport->dport_dev = dport_dev;
1138 dport->port_id = port_id;
1139 dport->port = port;
1140
1141 if (rcrb == CXL_RESOURCE_NONE) {
1142 rc = cxl_dport_setup_regs(&port->dev, dport,
1143 component_reg_phys);
1144 if (rc)
1145 return ERR_PTR(rc);
1146 } else {
1147 dport->rcrb.base = rcrb;
1148 component_reg_phys = __rcrb_to_component(dport_dev, &dport->rcrb,
1149 CXL_RCRB_DOWNSTREAM);
1150 if (component_reg_phys == CXL_RESOURCE_NONE) {
1151 dev_warn(dport_dev, "Invalid Component Registers in RCRB");
1152 return ERR_PTR(-ENXIO);
1153 }
1154
1155 /*
1156 * RCH @dport is not ready to map until associated with its
1157 * memdev
1158 */
1159 rc = cxl_dport_setup_regs(NULL, dport, component_reg_phys);
1160 if (rc)
1161 return ERR_PTR(rc);
1162
1163 dport->rch = true;
1164 }
1165
1166 if (component_reg_phys != CXL_RESOURCE_NONE)
1167 dev_dbg(dport_dev, "Component Registers found for dport: %pa\n",
1168 &component_reg_phys);
1169
1170 cond_cxl_root_lock(port);
1171 rc = add_dport(port, dport);
1172 cond_cxl_root_unlock(port);
1173 if (rc)
1174 return ERR_PTR(rc);
1175
1176 get_device(dport_dev);
1177 rc = devm_add_action_or_reset(host, cxl_dport_remove, dport);
1178 if (rc)
1179 return ERR_PTR(rc);
1180
1181 rc = sysfs_create_link(&port->dev.kobj, &dport_dev->kobj, link_name);
1182 if (rc)
1183 return ERR_PTR(rc);
1184
1185 rc = devm_add_action_or_reset(host, cxl_dport_unlink, dport);
1186 if (rc)
1187 return ERR_PTR(rc);
1188
1189 if (dev_is_pci(dport_dev))
1190 dport->link_latency = cxl_pci_get_latency(to_pci_dev(dport_dev));
1191
1192 cxl_debugfs_create_dport_dir(dport);
1193
1194 return dport;
1195}
1196
1197/**
1198 * devm_cxl_add_dport - append VH downstream port data to a cxl_port
1199 * @port: the cxl_port that references this dport
1200 * @dport_dev: firmware or PCI device representing the dport
1201 * @port_id: identifier for this dport in a decoder's target list
1202 * @component_reg_phys: optional location of CXL component registers
1203 *
1204 * Note that dports are appended to the devm release action's of the
1205 * either the port's host (for root ports), or the port itself (for
1206 * switch ports)
1207 */
1208struct cxl_dport *devm_cxl_add_dport(struct cxl_port *port,
1209 struct device *dport_dev, int port_id,
1210 resource_size_t component_reg_phys)
1211{
1212 struct cxl_dport *dport;
1213
1214 dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1215 component_reg_phys, CXL_RESOURCE_NONE);
1216 if (IS_ERR(dport)) {
1217 dev_dbg(dport_dev, "failed to add dport to %s: %ld\n",
1218 dev_name(&port->dev), PTR_ERR(dport));
1219 } else {
1220 dev_dbg(dport_dev, "dport added to %s\n",
1221 dev_name(&port->dev));
1222 }
1223
1224 return dport;
1225}
1226EXPORT_SYMBOL_NS_GPL(devm_cxl_add_dport, "CXL");
1227
1228/**
1229 * devm_cxl_add_rch_dport - append RCH downstream port data to a cxl_port
1230 * @port: the cxl_port that references this dport
1231 * @dport_dev: firmware or PCI device representing the dport
1232 * @port_id: identifier for this dport in a decoder's target list
1233 * @rcrb: mandatory location of a Root Complex Register Block
1234 *
1235 * See CXL 3.0 9.11.8 CXL Devices Attached to an RCH
1236 */
1237struct cxl_dport *devm_cxl_add_rch_dport(struct cxl_port *port,
1238 struct device *dport_dev, int port_id,
1239 resource_size_t rcrb)
1240{
1241 struct cxl_dport *dport;
1242
1243 if (rcrb == CXL_RESOURCE_NONE) {
1244 dev_dbg(&port->dev, "failed to add RCH dport, missing RCRB\n");
1245 return ERR_PTR(-EINVAL);
1246 }
1247
1248 dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1249 CXL_RESOURCE_NONE, rcrb);
1250 if (IS_ERR(dport)) {
1251 dev_dbg(dport_dev, "failed to add RCH dport to %s: %ld\n",
1252 dev_name(&port->dev), PTR_ERR(dport));
1253 } else {
1254 dev_dbg(dport_dev, "RCH dport added to %s\n",
1255 dev_name(&port->dev));
1256 }
1257
1258 return dport;
1259}
1260EXPORT_SYMBOL_NS_GPL(devm_cxl_add_rch_dport, "CXL");
1261
1262static int add_ep(struct cxl_ep *new)
1263{
1264 struct cxl_port *port = new->dport->port;
1265
1266 guard(device)(&port->dev);
1267 if (port->dead)
1268 return -ENXIO;
1269
1270 return xa_insert(&port->endpoints, (unsigned long)new->ep,
1271 new, GFP_KERNEL);
1272}
1273
1274/**
1275 * cxl_add_ep - register an endpoint's interest in a port
1276 * @dport: the dport that routes to @ep_dev
1277 * @ep_dev: device representing the endpoint
1278 *
1279 * Intermediate CXL ports are scanned based on the arrival of endpoints.
1280 * When those endpoints depart the port can be destroyed once all
1281 * endpoints that care about that port have been removed.
1282 */
1283static int cxl_add_ep(struct cxl_dport *dport, struct device *ep_dev)
1284{
1285 struct cxl_ep *ep;
1286 int rc;
1287
1288 ep = kzalloc(sizeof(*ep), GFP_KERNEL);
1289 if (!ep)
1290 return -ENOMEM;
1291
1292 ep->ep = get_device(ep_dev);
1293 ep->dport = dport;
1294
1295 rc = add_ep(ep);
1296 if (rc)
1297 cxl_ep_release(ep);
1298 return rc;
1299}
1300
1301struct cxl_find_port_ctx {
1302 const struct device *dport_dev;
1303 const struct cxl_port *parent_port;
1304 struct cxl_dport **dport;
1305};
1306
1307static int match_port_by_dport(struct device *dev, const void *data)
1308{
1309 const struct cxl_find_port_ctx *ctx = data;
1310 struct cxl_dport *dport;
1311 struct cxl_port *port;
1312
1313 if (!is_cxl_port(dev))
1314 return 0;
1315 if (ctx->parent_port && dev->parent != &ctx->parent_port->dev)
1316 return 0;
1317
1318 port = to_cxl_port(dev);
1319 dport = cxl_find_dport_by_dev(port, ctx->dport_dev);
1320 if (ctx->dport)
1321 *ctx->dport = dport;
1322 return dport != NULL;
1323}
1324
1325static struct cxl_port *__find_cxl_port(struct cxl_find_port_ctx *ctx)
1326{
1327 struct device *dev;
1328
1329 if (!ctx->dport_dev)
1330 return NULL;
1331
1332 dev = bus_find_device(&cxl_bus_type, NULL, ctx, match_port_by_dport);
1333 if (dev)
1334 return to_cxl_port(dev);
1335 return NULL;
1336}
1337
1338static struct cxl_port *find_cxl_port(struct device *dport_dev,
1339 struct cxl_dport **dport)
1340{
1341 struct cxl_find_port_ctx ctx = {
1342 .dport_dev = dport_dev,
1343 .dport = dport,
1344 };
1345 struct cxl_port *port;
1346
1347 port = __find_cxl_port(&ctx);
1348 return port;
1349}
1350
1351static struct cxl_port *find_cxl_port_at(struct cxl_port *parent_port,
1352 struct device *dport_dev,
1353 struct cxl_dport **dport)
1354{
1355 struct cxl_find_port_ctx ctx = {
1356 .dport_dev = dport_dev,
1357 .parent_port = parent_port,
1358 .dport = dport,
1359 };
1360 struct cxl_port *port;
1361
1362 port = __find_cxl_port(&ctx);
1363 return port;
1364}
1365
1366/*
1367 * All users of grandparent() are using it to walk PCIe-like switch port
1368 * hierarchy. A PCIe switch is comprised of a bridge device representing the
1369 * upstream switch port and N bridges representing downstream switch ports. When
1370 * bridges stack the grand-parent of a downstream switch port is another
1371 * downstream switch port in the immediate ancestor switch.
1372 */
1373static struct device *grandparent(struct device *dev)
1374{
1375 if (dev && dev->parent)
1376 return dev->parent->parent;
1377 return NULL;
1378}
1379
1380static struct device *endpoint_host(struct cxl_port *endpoint)
1381{
1382 struct cxl_port *port = to_cxl_port(endpoint->dev.parent);
1383
1384 if (is_cxl_root(port))
1385 return port->uport_dev;
1386 return &port->dev;
1387}
1388
1389static void delete_endpoint(void *data)
1390{
1391 struct cxl_memdev *cxlmd = data;
1392 struct cxl_port *endpoint = cxlmd->endpoint;
1393 struct device *host = endpoint_host(endpoint);
1394
1395 scoped_guard(device, host) {
1396 if (host->driver && !endpoint->dead) {
1397 devm_release_action(host, cxl_unlink_parent_dport, endpoint);
1398 devm_release_action(host, cxl_unlink_uport, endpoint);
1399 devm_release_action(host, unregister_port, endpoint);
1400 }
1401 cxlmd->endpoint = NULL;
1402 }
1403 put_device(&endpoint->dev);
1404 put_device(host);
1405}
1406
1407int cxl_endpoint_autoremove(struct cxl_memdev *cxlmd, struct cxl_port *endpoint)
1408{
1409 struct device *host = endpoint_host(endpoint);
1410 struct device *dev = &cxlmd->dev;
1411
1412 get_device(host);
1413 get_device(&endpoint->dev);
1414 cxlmd->depth = endpoint->depth;
1415 return devm_add_action_or_reset(dev, delete_endpoint, cxlmd);
1416}
1417EXPORT_SYMBOL_NS_GPL(cxl_endpoint_autoremove, "CXL");
1418
1419/*
1420 * The natural end of life of a non-root 'cxl_port' is when its parent port goes
1421 * through a ->remove() event ("top-down" unregistration). The unnatural trigger
1422 * for a port to be unregistered is when all memdevs beneath that port have gone
1423 * through ->remove(). This "bottom-up" removal selectively removes individual
1424 * child ports manually. This depends on devm_cxl_add_port() to not change is
1425 * devm action registration order, and for dports to have already been
1426 * destroyed by reap_dports().
1427 */
1428static void delete_switch_port(struct cxl_port *port)
1429{
1430 devm_release_action(port->dev.parent, cxl_unlink_parent_dport, port);
1431 devm_release_action(port->dev.parent, cxl_unlink_uport, port);
1432 devm_release_action(port->dev.parent, unregister_port, port);
1433}
1434
1435static void reap_dports(struct cxl_port *port)
1436{
1437 struct cxl_dport *dport;
1438 unsigned long index;
1439
1440 device_lock_assert(&port->dev);
1441
1442 xa_for_each(&port->dports, index, dport) {
1443 devm_release_action(&port->dev, cxl_dport_unlink, dport);
1444 devm_release_action(&port->dev, cxl_dport_remove, dport);
1445 devm_kfree(&port->dev, dport);
1446 }
1447}
1448
1449struct detach_ctx {
1450 struct cxl_memdev *cxlmd;
1451 int depth;
1452};
1453
1454static int port_has_memdev(struct device *dev, const void *data)
1455{
1456 const struct detach_ctx *ctx = data;
1457 struct cxl_port *port;
1458
1459 if (!is_cxl_port(dev))
1460 return 0;
1461
1462 port = to_cxl_port(dev);
1463 if (port->depth != ctx->depth)
1464 return 0;
1465
1466 return !!cxl_ep_load(port, ctx->cxlmd);
1467}
1468
1469static void cxl_detach_ep(void *data)
1470{
1471 struct cxl_memdev *cxlmd = data;
1472
1473 for (int i = cxlmd->depth - 1; i >= 1; i--) {
1474 struct cxl_port *port, *parent_port;
1475 struct detach_ctx ctx = {
1476 .cxlmd = cxlmd,
1477 .depth = i,
1478 };
1479 struct cxl_ep *ep;
1480 bool died = false;
1481
1482 struct device *dev __free(put_device) =
1483 bus_find_device(&cxl_bus_type, NULL, &ctx, port_has_memdev);
1484 if (!dev)
1485 continue;
1486 port = to_cxl_port(dev);
1487
1488 parent_port = to_cxl_port(port->dev.parent);
1489 device_lock(&parent_port->dev);
1490 device_lock(&port->dev);
1491 ep = cxl_ep_load(port, cxlmd);
1492 dev_dbg(&cxlmd->dev, "disconnect %s from %s\n",
1493 ep ? dev_name(ep->ep) : "", dev_name(&port->dev));
1494 cxl_ep_remove(port, ep);
1495 if (ep && !port->dead && xa_empty(&port->endpoints) &&
1496 !is_cxl_root(parent_port) && parent_port->dev.driver) {
1497 /*
1498 * This was the last ep attached to a dynamically
1499 * enumerated port. Block new cxl_add_ep() and garbage
1500 * collect the port.
1501 */
1502 died = true;
1503 port->dead = true;
1504 reap_dports(port);
1505 }
1506 device_unlock(&port->dev);
1507
1508 if (died) {
1509 dev_dbg(&cxlmd->dev, "delete %s\n",
1510 dev_name(&port->dev));
1511 delete_switch_port(port);
1512 }
1513 device_unlock(&parent_port->dev);
1514 }
1515}
1516
1517static resource_size_t find_component_registers(struct device *dev)
1518{
1519 struct cxl_register_map map;
1520 struct pci_dev *pdev;
1521
1522 /*
1523 * Theoretically, CXL component registers can be hosted on a
1524 * non-PCI device, in practice, only cxl_test hits this case.
1525 */
1526 if (!dev_is_pci(dev))
1527 return CXL_RESOURCE_NONE;
1528
1529 pdev = to_pci_dev(dev);
1530
1531 cxl_find_regblock(pdev, CXL_REGLOC_RBI_COMPONENT, &map);
1532 return map.resource;
1533}
1534
1535static int add_port_attach_ep(struct cxl_memdev *cxlmd,
1536 struct device *uport_dev,
1537 struct device *dport_dev)
1538{
1539 struct device *dparent = grandparent(dport_dev);
1540 struct cxl_dport *dport, *parent_dport;
1541 resource_size_t component_reg_phys;
1542 int rc;
1543
1544 if (!dparent) {
1545 /*
1546 * The iteration reached the topology root without finding the
1547 * CXL-root 'cxl_port' on a previous iteration, fail for now to
1548 * be re-probed after platform driver attaches.
1549 */
1550 dev_dbg(&cxlmd->dev, "%s is a root dport\n",
1551 dev_name(dport_dev));
1552 return -ENXIO;
1553 }
1554
1555 struct cxl_port *parent_port __free(put_cxl_port) =
1556 find_cxl_port(dparent, &parent_dport);
1557 if (!parent_port) {
1558 /* iterate to create this parent_port */
1559 return -EAGAIN;
1560 }
1561
1562 /*
1563 * Definition with __free() here to keep the sequence of
1564 * dereferencing the device of the port before the parent_port releasing.
1565 */
1566 struct cxl_port *port __free(put_cxl_port) = NULL;
1567 scoped_guard(device, &parent_port->dev) {
1568 if (!parent_port->dev.driver) {
1569 dev_warn(&cxlmd->dev,
1570 "port %s:%s disabled, failed to enumerate CXL.mem\n",
1571 dev_name(&parent_port->dev), dev_name(uport_dev));
1572 return -ENXIO;
1573 }
1574
1575 port = find_cxl_port_at(parent_port, dport_dev, &dport);
1576 if (!port) {
1577 component_reg_phys = find_component_registers(uport_dev);
1578 port = devm_cxl_add_port(&parent_port->dev, uport_dev,
1579 component_reg_phys, parent_dport);
1580 if (IS_ERR(port))
1581 return PTR_ERR(port);
1582
1583 /* retry find to pick up the new dport information */
1584 port = find_cxl_port_at(parent_port, dport_dev, &dport);
1585 if (!port)
1586 return -ENXIO;
1587 }
1588 }
1589
1590 dev_dbg(&cxlmd->dev, "add to new port %s:%s\n",
1591 dev_name(&port->dev), dev_name(port->uport_dev));
1592 rc = cxl_add_ep(dport, &cxlmd->dev);
1593 if (rc == -EBUSY) {
1594 /*
1595 * "can't" happen, but this error code means
1596 * something to the caller, so translate it.
1597 */
1598 rc = -ENXIO;
1599 }
1600
1601 return rc;
1602}
1603
1604int devm_cxl_enumerate_ports(struct cxl_memdev *cxlmd)
1605{
1606 struct device *dev = &cxlmd->dev;
1607 struct device *iter;
1608 int rc;
1609
1610 /*
1611 * Skip intermediate port enumeration in the RCH case, there
1612 * are no ports in between a host bridge and an endpoint.
1613 */
1614 if (cxlmd->cxlds->rcd)
1615 return 0;
1616
1617 rc = devm_add_action_or_reset(&cxlmd->dev, cxl_detach_ep, cxlmd);
1618 if (rc)
1619 return rc;
1620
1621 /*
1622 * Scan for and add all cxl_ports in this device's ancestry.
1623 * Repeat until no more ports are added. Abort if a port add
1624 * attempt fails.
1625 */
1626retry:
1627 for (iter = dev; iter; iter = grandparent(iter)) {
1628 struct device *dport_dev = grandparent(iter);
1629 struct device *uport_dev;
1630 struct cxl_dport *dport;
1631
1632 /*
1633 * The terminal "grandparent" in PCI is NULL and @platform_bus
1634 * for platform devices
1635 */
1636 if (!dport_dev || dport_dev == &platform_bus)
1637 return 0;
1638
1639 uport_dev = dport_dev->parent;
1640 if (!uport_dev) {
1641 dev_warn(dev, "at %s no parent for dport: %s\n",
1642 dev_name(iter), dev_name(dport_dev));
1643 return -ENXIO;
1644 }
1645
1646 dev_dbg(dev, "scan: iter: %s dport_dev: %s parent: %s\n",
1647 dev_name(iter), dev_name(dport_dev),
1648 dev_name(uport_dev));
1649 struct cxl_port *port __free(put_cxl_port) =
1650 find_cxl_port(dport_dev, &dport);
1651 if (port) {
1652 dev_dbg(&cxlmd->dev,
1653 "found already registered port %s:%s\n",
1654 dev_name(&port->dev),
1655 dev_name(port->uport_dev));
1656 rc = cxl_add_ep(dport, &cxlmd->dev);
1657
1658 /*
1659 * If the endpoint already exists in the port's list,
1660 * that's ok, it was added on a previous pass.
1661 * Otherwise, retry in add_port_attach_ep() after taking
1662 * the parent_port lock as the current port may be being
1663 * reaped.
1664 */
1665 if (rc && rc != -EBUSY)
1666 return rc;
1667
1668 cxl_gpf_port_setup(dport);
1669
1670 /* Any more ports to add between this one and the root? */
1671 if (!dev_is_cxl_root_child(&port->dev))
1672 continue;
1673
1674 return 0;
1675 }
1676
1677 rc = add_port_attach_ep(cxlmd, uport_dev, dport_dev);
1678 /* port missing, try to add parent */
1679 if (rc == -EAGAIN)
1680 continue;
1681 /* failed to add ep or port */
1682 if (rc)
1683 return rc;
1684 /* port added, new descendants possible, start over */
1685 goto retry;
1686 }
1687
1688 return 0;
1689}
1690EXPORT_SYMBOL_NS_GPL(devm_cxl_enumerate_ports, "CXL");
1691
1692struct cxl_port *cxl_pci_find_port(struct pci_dev *pdev,
1693 struct cxl_dport **dport)
1694{
1695 return find_cxl_port(pdev->dev.parent, dport);
1696}
1697EXPORT_SYMBOL_NS_GPL(cxl_pci_find_port, "CXL");
1698
1699struct cxl_port *cxl_mem_find_port(struct cxl_memdev *cxlmd,
1700 struct cxl_dport **dport)
1701{
1702 return find_cxl_port(grandparent(&cxlmd->dev), dport);
1703}
1704EXPORT_SYMBOL_NS_GPL(cxl_mem_find_port, "CXL");
1705
1706static int decoder_populate_targets(struct cxl_switch_decoder *cxlsd,
1707 struct cxl_port *port, int *target_map)
1708{
1709 int i;
1710
1711 if (!target_map)
1712 return 0;
1713
1714 device_lock_assert(&port->dev);
1715
1716 if (xa_empty(&port->dports))
1717 return -EINVAL;
1718
1719 guard(rwsem_write)(&cxl_rwsem.region);
1720 for (i = 0; i < cxlsd->cxld.interleave_ways; i++) {
1721 struct cxl_dport *dport = find_dport(port, target_map[i]);
1722
1723 if (!dport)
1724 return -ENXIO;
1725 cxlsd->target[i] = dport;
1726 }
1727
1728 return 0;
1729}
1730
1731static struct lock_class_key cxl_decoder_key;
1732
1733/**
1734 * cxl_decoder_init - Common decoder setup / initialization
1735 * @port: owning port of this decoder
1736 * @cxld: common decoder properties to initialize
1737 *
1738 * A port may contain one or more decoders. Each of those decoders
1739 * enable some address space for CXL.mem utilization. A decoder is
1740 * expected to be configured by the caller before registering via
1741 * cxl_decoder_add()
1742 */
1743static int cxl_decoder_init(struct cxl_port *port, struct cxl_decoder *cxld)
1744{
1745 struct device *dev;
1746 int rc;
1747
1748 rc = ida_alloc(&port->decoder_ida, GFP_KERNEL);
1749 if (rc < 0)
1750 return rc;
1751
1752 /* need parent to stick around to release the id */
1753 get_device(&port->dev);
1754 cxld->id = rc;
1755
1756 dev = &cxld->dev;
1757 device_initialize(dev);
1758 lockdep_set_class(&dev->mutex, &cxl_decoder_key);
1759 device_set_pm_not_required(dev);
1760 dev->parent = &port->dev;
1761 dev->bus = &cxl_bus_type;
1762
1763 /* Pre initialize an "empty" decoder */
1764 cxld->interleave_ways = 1;
1765 cxld->interleave_granularity = PAGE_SIZE;
1766 cxld->target_type = CXL_DECODER_HOSTONLYMEM;
1767 cxld->hpa_range = (struct range) {
1768 .start = 0,
1769 .end = -1,
1770 };
1771
1772 return 0;
1773}
1774
1775static int cxl_switch_decoder_init(struct cxl_port *port,
1776 struct cxl_switch_decoder *cxlsd,
1777 int nr_targets)
1778{
1779 if (nr_targets > CXL_DECODER_MAX_INTERLEAVE)
1780 return -EINVAL;
1781
1782 cxlsd->nr_targets = nr_targets;
1783 return cxl_decoder_init(port, &cxlsd->cxld);
1784}
1785
1786/**
1787 * cxl_root_decoder_alloc - Allocate a root level decoder
1788 * @port: owning CXL root of this decoder
1789 * @nr_targets: static number of downstream targets
1790 *
1791 * Return: A new cxl decoder to be registered by cxl_decoder_add(). A
1792 * 'CXL root' decoder is one that decodes from a top-level / static platform
1793 * firmware description of CXL resources into a CXL standard decode
1794 * topology.
1795 */
1796struct cxl_root_decoder *cxl_root_decoder_alloc(struct cxl_port *port,
1797 unsigned int nr_targets)
1798{
1799 struct cxl_root_decoder *cxlrd;
1800 struct cxl_switch_decoder *cxlsd;
1801 struct cxl_decoder *cxld;
1802 int rc;
1803
1804 if (!is_cxl_root(port))
1805 return ERR_PTR(-EINVAL);
1806
1807 cxlrd = kzalloc(struct_size(cxlrd, cxlsd.target, nr_targets),
1808 GFP_KERNEL);
1809 if (!cxlrd)
1810 return ERR_PTR(-ENOMEM);
1811
1812 cxlsd = &cxlrd->cxlsd;
1813 rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
1814 if (rc) {
1815 kfree(cxlrd);
1816 return ERR_PTR(rc);
1817 }
1818
1819 mutex_init(&cxlrd->range_lock);
1820
1821 cxld = &cxlsd->cxld;
1822 cxld->dev.type = &cxl_decoder_root_type;
1823 /*
1824 * cxl_root_decoder_release() special cases negative ids to
1825 * detect memregion_alloc() failures.
1826 */
1827 atomic_set(&cxlrd->region_id, -1);
1828 rc = memregion_alloc(GFP_KERNEL);
1829 if (rc < 0) {
1830 put_device(&cxld->dev);
1831 return ERR_PTR(rc);
1832 }
1833
1834 atomic_set(&cxlrd->region_id, rc);
1835 cxlrd->qos_class = CXL_QOS_CLASS_INVALID;
1836 return cxlrd;
1837}
1838EXPORT_SYMBOL_NS_GPL(cxl_root_decoder_alloc, "CXL");
1839
1840/**
1841 * cxl_switch_decoder_alloc - Allocate a switch level decoder
1842 * @port: owning CXL switch port of this decoder
1843 * @nr_targets: max number of dynamically addressable downstream targets
1844 *
1845 * Return: A new cxl decoder to be registered by cxl_decoder_add(). A
1846 * 'switch' decoder is any decoder that can be enumerated by PCIe
1847 * topology and the HDM Decoder Capability. This includes the decoders
1848 * that sit between Switch Upstream Ports / Switch Downstream Ports and
1849 * Host Bridges / Root Ports.
1850 */
1851struct cxl_switch_decoder *cxl_switch_decoder_alloc(struct cxl_port *port,
1852 unsigned int nr_targets)
1853{
1854 struct cxl_switch_decoder *cxlsd;
1855 struct cxl_decoder *cxld;
1856 int rc;
1857
1858 if (is_cxl_root(port) || is_cxl_endpoint(port))
1859 return ERR_PTR(-EINVAL);
1860
1861 cxlsd = kzalloc(struct_size(cxlsd, target, nr_targets), GFP_KERNEL);
1862 if (!cxlsd)
1863 return ERR_PTR(-ENOMEM);
1864
1865 rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
1866 if (rc) {
1867 kfree(cxlsd);
1868 return ERR_PTR(rc);
1869 }
1870
1871 cxld = &cxlsd->cxld;
1872 cxld->dev.type = &cxl_decoder_switch_type;
1873 return cxlsd;
1874}
1875EXPORT_SYMBOL_NS_GPL(cxl_switch_decoder_alloc, "CXL");
1876
1877/**
1878 * cxl_endpoint_decoder_alloc - Allocate an endpoint decoder
1879 * @port: owning port of this decoder
1880 *
1881 * Return: A new cxl decoder to be registered by cxl_decoder_add()
1882 */
1883struct cxl_endpoint_decoder *cxl_endpoint_decoder_alloc(struct cxl_port *port)
1884{
1885 struct cxl_endpoint_decoder *cxled;
1886 struct cxl_decoder *cxld;
1887 int rc;
1888
1889 if (!is_cxl_endpoint(port))
1890 return ERR_PTR(-EINVAL);
1891
1892 cxled = kzalloc(sizeof(*cxled), GFP_KERNEL);
1893 if (!cxled)
1894 return ERR_PTR(-ENOMEM);
1895
1896 cxled->pos = -1;
1897 cxled->part = -1;
1898 cxld = &cxled->cxld;
1899 rc = cxl_decoder_init(port, cxld);
1900 if (rc) {
1901 kfree(cxled);
1902 return ERR_PTR(rc);
1903 }
1904
1905 cxld->dev.type = &cxl_decoder_endpoint_type;
1906 return cxled;
1907}
1908EXPORT_SYMBOL_NS_GPL(cxl_endpoint_decoder_alloc, "CXL");
1909
1910/**
1911 * cxl_decoder_add_locked - Add a decoder with targets
1912 * @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
1913 * @target_map: A list of downstream ports that this decoder can direct memory
1914 * traffic to. These numbers should correspond with the port number
1915 * in the PCIe Link Capabilities structure.
1916 *
1917 * Certain types of decoders may not have any targets. The main example of this
1918 * is an endpoint device. A more awkward example is a hostbridge whose root
1919 * ports get hot added (technically possible, though unlikely).
1920 *
1921 * This is the locked variant of cxl_decoder_add().
1922 *
1923 * Context: Process context. Expects the device lock of the port that owns the
1924 * @cxld to be held.
1925 *
1926 * Return: Negative error code if the decoder wasn't properly configured; else
1927 * returns 0.
1928 */
1929int cxl_decoder_add_locked(struct cxl_decoder *cxld, int *target_map)
1930{
1931 struct cxl_port *port;
1932 struct device *dev;
1933 int rc;
1934
1935 if (WARN_ON_ONCE(!cxld))
1936 return -EINVAL;
1937
1938 if (WARN_ON_ONCE(IS_ERR(cxld)))
1939 return PTR_ERR(cxld);
1940
1941 if (cxld->interleave_ways < 1)
1942 return -EINVAL;
1943
1944 dev = &cxld->dev;
1945
1946 port = to_cxl_port(cxld->dev.parent);
1947 if (!is_endpoint_decoder(dev)) {
1948 struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
1949
1950 rc = decoder_populate_targets(cxlsd, port, target_map);
1951 if (rc && (cxld->flags & CXL_DECODER_F_ENABLE)) {
1952 dev_err(&port->dev,
1953 "Failed to populate active decoder targets\n");
1954 return rc;
1955 }
1956 }
1957
1958 rc = dev_set_name(dev, "decoder%d.%d", port->id, cxld->id);
1959 if (rc)
1960 return rc;
1961
1962 return device_add(dev);
1963}
1964EXPORT_SYMBOL_NS_GPL(cxl_decoder_add_locked, "CXL");
1965
1966/**
1967 * cxl_decoder_add - Add a decoder with targets
1968 * @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
1969 * @target_map: A list of downstream ports that this decoder can direct memory
1970 * traffic to. These numbers should correspond with the port number
1971 * in the PCIe Link Capabilities structure.
1972 *
1973 * This is the unlocked variant of cxl_decoder_add_locked().
1974 * See cxl_decoder_add_locked().
1975 *
1976 * Context: Process context. Takes and releases the device lock of the port that
1977 * owns the @cxld.
1978 */
1979int cxl_decoder_add(struct cxl_decoder *cxld, int *target_map)
1980{
1981 struct cxl_port *port;
1982
1983 if (WARN_ON_ONCE(!cxld))
1984 return -EINVAL;
1985
1986 if (WARN_ON_ONCE(IS_ERR(cxld)))
1987 return PTR_ERR(cxld);
1988
1989 port = to_cxl_port(cxld->dev.parent);
1990
1991 guard(device)(&port->dev);
1992 return cxl_decoder_add_locked(cxld, target_map);
1993}
1994EXPORT_SYMBOL_NS_GPL(cxl_decoder_add, "CXL");
1995
1996static void cxld_unregister(void *dev)
1997{
1998 if (is_endpoint_decoder(dev))
1999 cxl_decoder_detach(NULL, to_cxl_endpoint_decoder(dev), -1,
2000 DETACH_INVALIDATE);
2001
2002 device_unregister(dev);
2003}
2004
2005int cxl_decoder_autoremove(struct device *host, struct cxl_decoder *cxld)
2006{
2007 return devm_add_action_or_reset(host, cxld_unregister, &cxld->dev);
2008}
2009EXPORT_SYMBOL_NS_GPL(cxl_decoder_autoremove, "CXL");
2010
2011/**
2012 * __cxl_driver_register - register a driver for the cxl bus
2013 * @cxl_drv: cxl driver structure to attach
2014 * @owner: owning module/driver
2015 * @modname: KBUILD_MODNAME for parent driver
2016 */
2017int __cxl_driver_register(struct cxl_driver *cxl_drv, struct module *owner,
2018 const char *modname)
2019{
2020 if (!cxl_drv->probe) {
2021 pr_debug("%s ->probe() must be specified\n", modname);
2022 return -EINVAL;
2023 }
2024
2025 if (!cxl_drv->name) {
2026 pr_debug("%s ->name must be specified\n", modname);
2027 return -EINVAL;
2028 }
2029
2030 if (!cxl_drv->id) {
2031 pr_debug("%s ->id must be specified\n", modname);
2032 return -EINVAL;
2033 }
2034
2035 cxl_drv->drv.bus = &cxl_bus_type;
2036 cxl_drv->drv.owner = owner;
2037 cxl_drv->drv.mod_name = modname;
2038 cxl_drv->drv.name = cxl_drv->name;
2039
2040 return driver_register(&cxl_drv->drv);
2041}
2042EXPORT_SYMBOL_NS_GPL(__cxl_driver_register, "CXL");
2043
2044void cxl_driver_unregister(struct cxl_driver *cxl_drv)
2045{
2046 driver_unregister(&cxl_drv->drv);
2047}
2048EXPORT_SYMBOL_NS_GPL(cxl_driver_unregister, "CXL");
2049
2050static int cxl_bus_uevent(const struct device *dev, struct kobj_uevent_env *env)
2051{
2052 return add_uevent_var(env, "MODALIAS=" CXL_MODALIAS_FMT,
2053 cxl_device_id(dev));
2054}
2055
2056static int cxl_bus_match(struct device *dev, const struct device_driver *drv)
2057{
2058 return cxl_device_id(dev) == to_cxl_drv(drv)->id;
2059}
2060
2061static int cxl_bus_probe(struct device *dev)
2062{
2063 int rc;
2064
2065 rc = to_cxl_drv(dev->driver)->probe(dev);
2066 dev_dbg(dev, "probe: %d\n", rc);
2067 return rc;
2068}
2069
2070static void cxl_bus_remove(struct device *dev)
2071{
2072 struct cxl_driver *cxl_drv = to_cxl_drv(dev->driver);
2073
2074 if (cxl_drv->remove)
2075 cxl_drv->remove(dev);
2076}
2077
2078static struct workqueue_struct *cxl_bus_wq;
2079
2080static int cxl_rescan_attach(struct device *dev, void *data)
2081{
2082 int rc = device_attach(dev);
2083
2084 dev_vdbg(dev, "rescan: %s\n", rc ? "attach" : "detached");
2085
2086 return 0;
2087}
2088
2089static void cxl_bus_rescan_queue(struct work_struct *w)
2090{
2091 bus_for_each_dev(&cxl_bus_type, NULL, NULL, cxl_rescan_attach);
2092}
2093
2094void cxl_bus_rescan(void)
2095{
2096 static DECLARE_WORK(rescan_work, cxl_bus_rescan_queue);
2097
2098 queue_work(cxl_bus_wq, &rescan_work);
2099}
2100EXPORT_SYMBOL_NS_GPL(cxl_bus_rescan, "CXL");
2101
2102void cxl_bus_drain(void)
2103{
2104 drain_workqueue(cxl_bus_wq);
2105}
2106EXPORT_SYMBOL_NS_GPL(cxl_bus_drain, "CXL");
2107
2108bool schedule_cxl_memdev_detach(struct cxl_memdev *cxlmd)
2109{
2110 return queue_work(cxl_bus_wq, &cxlmd->detach_work);
2111}
2112EXPORT_SYMBOL_NS_GPL(schedule_cxl_memdev_detach, "CXL");
2113
2114static void add_latency(struct access_coordinate *c, long latency)
2115{
2116 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2117 c[i].write_latency += latency;
2118 c[i].read_latency += latency;
2119 }
2120}
2121
2122static bool coordinates_valid(struct access_coordinate *c)
2123{
2124 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2125 if (c[i].read_bandwidth && c[i].write_bandwidth &&
2126 c[i].read_latency && c[i].write_latency)
2127 continue;
2128 return false;
2129 }
2130
2131 return true;
2132}
2133
2134static void set_min_bandwidth(struct access_coordinate *c, unsigned int bw)
2135{
2136 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2137 c[i].write_bandwidth = min(c[i].write_bandwidth, bw);
2138 c[i].read_bandwidth = min(c[i].read_bandwidth, bw);
2139 }
2140}
2141
2142static void set_access_coordinates(struct access_coordinate *out,
2143 struct access_coordinate *in)
2144{
2145 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++)
2146 out[i] = in[i];
2147}
2148
2149static bool parent_port_is_cxl_root(struct cxl_port *port)
2150{
2151 return is_cxl_root(to_cxl_port(port->dev.parent));
2152}
2153
2154/**
2155 * cxl_endpoint_get_perf_coordinates - Retrieve performance numbers stored in dports
2156 * of CXL path
2157 * @port: endpoint cxl_port
2158 * @coord: output performance data
2159 *
2160 * Return: errno on failure, 0 on success.
2161 */
2162int cxl_endpoint_get_perf_coordinates(struct cxl_port *port,
2163 struct access_coordinate *coord)
2164{
2165 struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
2166 struct access_coordinate c[] = {
2167 {
2168 .read_bandwidth = UINT_MAX,
2169 .write_bandwidth = UINT_MAX,
2170 },
2171 {
2172 .read_bandwidth = UINT_MAX,
2173 .write_bandwidth = UINT_MAX,
2174 },
2175 };
2176 struct cxl_port *iter = port;
2177 struct cxl_dport *dport;
2178 struct pci_dev *pdev;
2179 struct device *dev;
2180 unsigned int bw;
2181 bool is_cxl_root;
2182
2183 if (!is_cxl_endpoint(port))
2184 return -EINVAL;
2185
2186 /*
2187 * Skip calculation for RCD. Expectation is HMAT already covers RCD case
2188 * since RCH does not support hotplug.
2189 */
2190 if (cxlmd->cxlds->rcd)
2191 return 0;
2192
2193 /*
2194 * Exit the loop when the parent port of the current iter port is cxl
2195 * root. The iterative loop starts at the endpoint and gathers the
2196 * latency of the CXL link from the current device/port to the connected
2197 * downstream port each iteration.
2198 */
2199 do {
2200 dport = iter->parent_dport;
2201 iter = to_cxl_port(iter->dev.parent);
2202 is_cxl_root = parent_port_is_cxl_root(iter);
2203
2204 /*
2205 * There's no valid access_coordinate for a root port since RPs do not
2206 * have CDAT and therefore needs to be skipped.
2207 */
2208 if (!is_cxl_root) {
2209 if (!coordinates_valid(dport->coord))
2210 return -EINVAL;
2211 cxl_coordinates_combine(c, c, dport->coord);
2212 }
2213 add_latency(c, dport->link_latency);
2214 } while (!is_cxl_root);
2215
2216 dport = iter->parent_dport;
2217 /* Retrieve HB coords */
2218 if (!coordinates_valid(dport->coord))
2219 return -EINVAL;
2220 cxl_coordinates_combine(c, c, dport->coord);
2221
2222 dev = port->uport_dev->parent;
2223 if (!dev_is_pci(dev))
2224 return -ENODEV;
2225
2226 /* Get the calculated PCI paths bandwidth */
2227 pdev = to_pci_dev(dev);
2228 bw = pcie_bandwidth_available(pdev, NULL, NULL, NULL);
2229 if (bw == 0)
2230 return -ENXIO;
2231 bw /= BITS_PER_BYTE;
2232
2233 set_min_bandwidth(c, bw);
2234 set_access_coordinates(coord, c);
2235
2236 return 0;
2237}
2238EXPORT_SYMBOL_NS_GPL(cxl_endpoint_get_perf_coordinates, "CXL");
2239
2240int cxl_port_get_switch_dport_bandwidth(struct cxl_port *port,
2241 struct access_coordinate *c)
2242{
2243 struct cxl_dport *dport = port->parent_dport;
2244
2245 /* Check this port is connected to a switch DSP and not an RP */
2246 if (parent_port_is_cxl_root(to_cxl_port(port->dev.parent)))
2247 return -ENODEV;
2248
2249 if (!coordinates_valid(dport->coord))
2250 return -EINVAL;
2251
2252 for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2253 c[i].read_bandwidth = dport->coord[i].read_bandwidth;
2254 c[i].write_bandwidth = dport->coord[i].write_bandwidth;
2255 }
2256
2257 return 0;
2258}
2259
2260/* for user tooling to ensure port disable work has completed */
2261static ssize_t flush_store(const struct bus_type *bus, const char *buf, size_t count)
2262{
2263 if (sysfs_streq(buf, "1")) {
2264 flush_workqueue(cxl_bus_wq);
2265 return count;
2266 }
2267
2268 return -EINVAL;
2269}
2270
2271static BUS_ATTR_WO(flush);
2272
2273static struct attribute *cxl_bus_attributes[] = {
2274 &bus_attr_flush.attr,
2275 NULL,
2276};
2277
2278static struct attribute_group cxl_bus_attribute_group = {
2279 .attrs = cxl_bus_attributes,
2280};
2281
2282static const struct attribute_group *cxl_bus_attribute_groups[] = {
2283 &cxl_bus_attribute_group,
2284 NULL,
2285};
2286
2287const struct bus_type cxl_bus_type = {
2288 .name = "cxl",
2289 .uevent = cxl_bus_uevent,
2290 .match = cxl_bus_match,
2291 .probe = cxl_bus_probe,
2292 .remove = cxl_bus_remove,
2293 .bus_groups = cxl_bus_attribute_groups,
2294};
2295EXPORT_SYMBOL_NS_GPL(cxl_bus_type, "CXL");
2296
2297static struct dentry *cxl_debugfs;
2298
2299struct dentry *cxl_debugfs_create_dir(const char *dir)
2300{
2301 return debugfs_create_dir(dir, cxl_debugfs);
2302}
2303EXPORT_SYMBOL_NS_GPL(cxl_debugfs_create_dir, "CXL");
2304
2305static __init int cxl_core_init(void)
2306{
2307 int rc;
2308
2309 cxl_debugfs = debugfs_create_dir("cxl", NULL);
2310
2311 if (einj_cxl_is_initialized())
2312 debugfs_create_file("einj_types", 0400, cxl_debugfs, NULL,
2313 &einj_cxl_available_error_type_fops);
2314
2315 cxl_mbox_init();
2316
2317 rc = cxl_memdev_init();
2318 if (rc)
2319 return rc;
2320
2321 cxl_bus_wq = alloc_ordered_workqueue("cxl_port", 0);
2322 if (!cxl_bus_wq) {
2323 rc = -ENOMEM;
2324 goto err_wq;
2325 }
2326
2327 rc = bus_register(&cxl_bus_type);
2328 if (rc)
2329 goto err_bus;
2330
2331 rc = cxl_region_init();
2332 if (rc)
2333 goto err_region;
2334
2335 rc = cxl_ras_init();
2336 if (rc)
2337 goto err_ras;
2338
2339 return 0;
2340
2341err_ras:
2342 cxl_region_exit();
2343err_region:
2344 bus_unregister(&cxl_bus_type);
2345err_bus:
2346 destroy_workqueue(cxl_bus_wq);
2347err_wq:
2348 cxl_memdev_exit();
2349 return rc;
2350}
2351
2352static void cxl_core_exit(void)
2353{
2354 cxl_ras_exit();
2355 cxl_region_exit();
2356 bus_unregister(&cxl_bus_type);
2357 destroy_workqueue(cxl_bus_wq);
2358 cxl_memdev_exit();
2359 debugfs_remove_recursive(cxl_debugfs);
2360}
2361
2362subsys_initcall(cxl_core_init);
2363module_exit(cxl_core_exit);
2364MODULE_DESCRIPTION("CXL: Core Compute Express Link support");
2365MODULE_LICENSE("GPL v2");
2366MODULE_IMPORT_NS("CXL");