Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
torvalds
GitHub Repository: torvalds/linux
Path: blob/master/drivers/cxl/core/port.c
29537 views
1
// SPDX-License-Identifier: GPL-2.0-only
2
/* Copyright(c) 2020 Intel Corporation. All rights reserved. */
3
#include <linux/platform_device.h>
4
#include <linux/memregion.h>
5
#include <linux/workqueue.h>
6
#include <linux/debugfs.h>
7
#include <linux/device.h>
8
#include <linux/module.h>
9
#include <linux/pci.h>
10
#include <linux/slab.h>
11
#include <linux/idr.h>
12
#include <linux/node.h>
13
#include <cxl/einj.h>
14
#include <cxlmem.h>
15
#include <cxlpci.h>
16
#include <cxl.h>
17
#include "core.h"
18
19
/**
20
* DOC: cxl core
21
*
22
* The CXL core provides a set of interfaces that can be consumed by CXL aware
23
* drivers. The interfaces allow for creation, modification, and destruction of
24
* regions, memory devices, ports, and decoders. CXL aware drivers must register
25
* with the CXL core via these interfaces in order to be able to participate in
26
* cross-device interleave coordination. The CXL core also establishes and
27
* maintains the bridge to the nvdimm subsystem.
28
*
29
* CXL core introduces sysfs hierarchy to control the devices that are
30
* instantiated by the core.
31
*/
32
33
static DEFINE_IDA(cxl_port_ida);
34
static DEFINE_XARRAY(cxl_root_buses);
35
36
/*
37
* The terminal device in PCI is NULL and @platform_bus
38
* for platform devices (for cxl_test)
39
*/
40
static bool is_cxl_host_bridge(struct device *dev)
41
{
42
return (!dev || dev == &platform_bus);
43
}
44
45
int cxl_num_decoders_committed(struct cxl_port *port)
46
{
47
lockdep_assert_held(&cxl_rwsem.region);
48
49
return port->commit_end + 1;
50
}
51
52
static ssize_t devtype_show(struct device *dev, struct device_attribute *attr,
53
char *buf)
54
{
55
return sysfs_emit(buf, "%s\n", dev->type->name);
56
}
57
static DEVICE_ATTR_RO(devtype);
58
59
static int cxl_device_id(const struct device *dev)
60
{
61
if (dev->type == &cxl_nvdimm_bridge_type)
62
return CXL_DEVICE_NVDIMM_BRIDGE;
63
if (dev->type == &cxl_nvdimm_type)
64
return CXL_DEVICE_NVDIMM;
65
if (dev->type == CXL_PMEM_REGION_TYPE())
66
return CXL_DEVICE_PMEM_REGION;
67
if (dev->type == CXL_DAX_REGION_TYPE())
68
return CXL_DEVICE_DAX_REGION;
69
if (is_cxl_port(dev)) {
70
if (is_cxl_root(to_cxl_port(dev)))
71
return CXL_DEVICE_ROOT;
72
return CXL_DEVICE_PORT;
73
}
74
if (is_cxl_memdev(dev))
75
return CXL_DEVICE_MEMORY_EXPANDER;
76
if (dev->type == CXL_REGION_TYPE())
77
return CXL_DEVICE_REGION;
78
if (dev->type == &cxl_pmu_type)
79
return CXL_DEVICE_PMU;
80
return 0;
81
}
82
83
static ssize_t modalias_show(struct device *dev, struct device_attribute *attr,
84
char *buf)
85
{
86
return sysfs_emit(buf, CXL_MODALIAS_FMT "\n", cxl_device_id(dev));
87
}
88
static DEVICE_ATTR_RO(modalias);
89
90
static struct attribute *cxl_base_attributes[] = {
91
&dev_attr_devtype.attr,
92
&dev_attr_modalias.attr,
93
NULL,
94
};
95
96
struct attribute_group cxl_base_attribute_group = {
97
.attrs = cxl_base_attributes,
98
};
99
100
static ssize_t start_show(struct device *dev, struct device_attribute *attr,
101
char *buf)
102
{
103
struct cxl_decoder *cxld = to_cxl_decoder(dev);
104
105
return sysfs_emit(buf, "%#llx\n", cxld->hpa_range.start);
106
}
107
static DEVICE_ATTR_ADMIN_RO(start);
108
109
static ssize_t size_show(struct device *dev, struct device_attribute *attr,
110
char *buf)
111
{
112
struct cxl_decoder *cxld = to_cxl_decoder(dev);
113
114
return sysfs_emit(buf, "%#llx\n", range_len(&cxld->hpa_range));
115
}
116
static DEVICE_ATTR_RO(size);
117
118
#define CXL_DECODER_FLAG_ATTR(name, flag) \
119
static ssize_t name##_show(struct device *dev, \
120
struct device_attribute *attr, char *buf) \
121
{ \
122
struct cxl_decoder *cxld = to_cxl_decoder(dev); \
123
\
124
return sysfs_emit(buf, "%s\n", \
125
(cxld->flags & (flag)) ? "1" : "0"); \
126
} \
127
static DEVICE_ATTR_RO(name)
128
129
CXL_DECODER_FLAG_ATTR(cap_pmem, CXL_DECODER_F_PMEM);
130
CXL_DECODER_FLAG_ATTR(cap_ram, CXL_DECODER_F_RAM);
131
CXL_DECODER_FLAG_ATTR(cap_type2, CXL_DECODER_F_TYPE2);
132
CXL_DECODER_FLAG_ATTR(cap_type3, CXL_DECODER_F_TYPE3);
133
CXL_DECODER_FLAG_ATTR(locked, CXL_DECODER_F_LOCK);
134
135
static ssize_t target_type_show(struct device *dev,
136
struct device_attribute *attr, char *buf)
137
{
138
struct cxl_decoder *cxld = to_cxl_decoder(dev);
139
140
switch (cxld->target_type) {
141
case CXL_DECODER_DEVMEM:
142
return sysfs_emit(buf, "accelerator\n");
143
case CXL_DECODER_HOSTONLYMEM:
144
return sysfs_emit(buf, "expander\n");
145
}
146
return -ENXIO;
147
}
148
static DEVICE_ATTR_RO(target_type);
149
150
static ssize_t emit_target_list(struct cxl_switch_decoder *cxlsd, char *buf)
151
{
152
struct cxl_decoder *cxld = &cxlsd->cxld;
153
ssize_t offset = 0;
154
int i, rc = 0;
155
156
for (i = 0; i < cxld->interleave_ways; i++) {
157
struct cxl_dport *dport = cxlsd->target[i];
158
struct cxl_dport *next = NULL;
159
160
if (!dport)
161
break;
162
163
if (i + 1 < cxld->interleave_ways)
164
next = cxlsd->target[i + 1];
165
rc = sysfs_emit_at(buf, offset, "%d%s", dport->port_id,
166
next ? "," : "");
167
if (rc < 0)
168
return rc;
169
offset += rc;
170
}
171
172
return offset;
173
}
174
175
static ssize_t target_list_show(struct device *dev,
176
struct device_attribute *attr, char *buf)
177
{
178
struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
179
ssize_t offset;
180
int rc;
181
182
guard(rwsem_read)(&cxl_rwsem.region);
183
rc = emit_target_list(cxlsd, buf);
184
if (rc < 0)
185
return rc;
186
offset = rc;
187
188
rc = sysfs_emit_at(buf, offset, "\n");
189
if (rc < 0)
190
return rc;
191
192
return offset + rc;
193
}
194
static DEVICE_ATTR_RO(target_list);
195
196
static ssize_t mode_show(struct device *dev, struct device_attribute *attr,
197
char *buf)
198
{
199
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
200
struct cxl_memdev *cxlmd = cxled_to_memdev(cxled);
201
struct cxl_dev_state *cxlds = cxlmd->cxlds;
202
/* without @cxl_rwsem.dpa, make sure @part is not reloaded */
203
int part = READ_ONCE(cxled->part);
204
const char *desc;
205
206
if (part < 0)
207
desc = "none";
208
else
209
desc = cxlds->part[part].res.name;
210
211
return sysfs_emit(buf, "%s\n", desc);
212
}
213
214
static ssize_t mode_store(struct device *dev, struct device_attribute *attr,
215
const char *buf, size_t len)
216
{
217
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
218
enum cxl_partition_mode mode;
219
ssize_t rc;
220
221
if (sysfs_streq(buf, "pmem"))
222
mode = CXL_PARTMODE_PMEM;
223
else if (sysfs_streq(buf, "ram"))
224
mode = CXL_PARTMODE_RAM;
225
else
226
return -EINVAL;
227
228
rc = cxl_dpa_set_part(cxled, mode);
229
if (rc)
230
return rc;
231
232
return len;
233
}
234
static DEVICE_ATTR_RW(mode);
235
236
static ssize_t dpa_resource_show(struct device *dev, struct device_attribute *attr,
237
char *buf)
238
{
239
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
240
241
guard(rwsem_read)(&cxl_rwsem.dpa);
242
return sysfs_emit(buf, "%#llx\n", (u64)cxl_dpa_resource_start(cxled));
243
}
244
static DEVICE_ATTR_RO(dpa_resource);
245
246
static ssize_t dpa_size_show(struct device *dev, struct device_attribute *attr,
247
char *buf)
248
{
249
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
250
resource_size_t size = cxl_dpa_size(cxled);
251
252
return sysfs_emit(buf, "%pa\n", &size);
253
}
254
255
static ssize_t dpa_size_store(struct device *dev, struct device_attribute *attr,
256
const char *buf, size_t len)
257
{
258
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
259
unsigned long long size;
260
ssize_t rc;
261
262
rc = kstrtoull(buf, 0, &size);
263
if (rc)
264
return rc;
265
266
if (!IS_ALIGNED(size, SZ_256M))
267
return -EINVAL;
268
269
rc = cxl_dpa_free(cxled);
270
if (rc)
271
return rc;
272
273
if (size == 0)
274
return len;
275
276
rc = cxl_dpa_alloc(cxled, size);
277
if (rc)
278
return rc;
279
280
return len;
281
}
282
static DEVICE_ATTR_RW(dpa_size);
283
284
static ssize_t interleave_granularity_show(struct device *dev,
285
struct device_attribute *attr,
286
char *buf)
287
{
288
struct cxl_decoder *cxld = to_cxl_decoder(dev);
289
290
return sysfs_emit(buf, "%d\n", cxld->interleave_granularity);
291
}
292
293
static DEVICE_ATTR_RO(interleave_granularity);
294
295
static ssize_t interleave_ways_show(struct device *dev,
296
struct device_attribute *attr, char *buf)
297
{
298
struct cxl_decoder *cxld = to_cxl_decoder(dev);
299
300
return sysfs_emit(buf, "%d\n", cxld->interleave_ways);
301
}
302
303
static DEVICE_ATTR_RO(interleave_ways);
304
305
static ssize_t qos_class_show(struct device *dev,
306
struct device_attribute *attr, char *buf)
307
{
308
struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
309
310
return sysfs_emit(buf, "%d\n", cxlrd->qos_class);
311
}
312
static DEVICE_ATTR_RO(qos_class);
313
314
static struct attribute *cxl_decoder_base_attrs[] = {
315
&dev_attr_start.attr,
316
&dev_attr_size.attr,
317
&dev_attr_locked.attr,
318
&dev_attr_interleave_granularity.attr,
319
&dev_attr_interleave_ways.attr,
320
NULL,
321
};
322
323
static struct attribute_group cxl_decoder_base_attribute_group = {
324
.attrs = cxl_decoder_base_attrs,
325
};
326
327
static struct attribute *cxl_decoder_root_attrs[] = {
328
&dev_attr_cap_pmem.attr,
329
&dev_attr_cap_ram.attr,
330
&dev_attr_cap_type2.attr,
331
&dev_attr_cap_type3.attr,
332
&dev_attr_target_list.attr,
333
&dev_attr_qos_class.attr,
334
SET_CXL_REGION_ATTR(create_pmem_region)
335
SET_CXL_REGION_ATTR(create_ram_region)
336
SET_CXL_REGION_ATTR(delete_region)
337
NULL,
338
};
339
340
static bool can_create_pmem(struct cxl_root_decoder *cxlrd)
341
{
342
unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_PMEM;
343
344
return (cxlrd->cxlsd.cxld.flags & flags) == flags;
345
}
346
347
static bool can_create_ram(struct cxl_root_decoder *cxlrd)
348
{
349
unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_RAM;
350
351
return (cxlrd->cxlsd.cxld.flags & flags) == flags;
352
}
353
354
static umode_t cxl_root_decoder_visible(struct kobject *kobj, struct attribute *a, int n)
355
{
356
struct device *dev = kobj_to_dev(kobj);
357
struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
358
359
if (a == CXL_REGION_ATTR(create_pmem_region) && !can_create_pmem(cxlrd))
360
return 0;
361
362
if (a == CXL_REGION_ATTR(create_ram_region) && !can_create_ram(cxlrd))
363
return 0;
364
365
if (a == CXL_REGION_ATTR(delete_region) &&
366
!(can_create_pmem(cxlrd) || can_create_ram(cxlrd)))
367
return 0;
368
369
return a->mode;
370
}
371
372
static struct attribute_group cxl_decoder_root_attribute_group = {
373
.attrs = cxl_decoder_root_attrs,
374
.is_visible = cxl_root_decoder_visible,
375
};
376
377
static const struct attribute_group *cxl_decoder_root_attribute_groups[] = {
378
&cxl_decoder_root_attribute_group,
379
&cxl_decoder_base_attribute_group,
380
&cxl_base_attribute_group,
381
NULL,
382
};
383
384
static struct attribute *cxl_decoder_switch_attrs[] = {
385
&dev_attr_target_type.attr,
386
&dev_attr_target_list.attr,
387
SET_CXL_REGION_ATTR(region)
388
NULL,
389
};
390
391
static struct attribute_group cxl_decoder_switch_attribute_group = {
392
.attrs = cxl_decoder_switch_attrs,
393
};
394
395
static const struct attribute_group *cxl_decoder_switch_attribute_groups[] = {
396
&cxl_decoder_switch_attribute_group,
397
&cxl_decoder_base_attribute_group,
398
&cxl_base_attribute_group,
399
NULL,
400
};
401
402
static struct attribute *cxl_decoder_endpoint_attrs[] = {
403
&dev_attr_target_type.attr,
404
&dev_attr_mode.attr,
405
&dev_attr_dpa_size.attr,
406
&dev_attr_dpa_resource.attr,
407
SET_CXL_REGION_ATTR(region)
408
NULL,
409
};
410
411
static struct attribute_group cxl_decoder_endpoint_attribute_group = {
412
.attrs = cxl_decoder_endpoint_attrs,
413
};
414
415
static const struct attribute_group *cxl_decoder_endpoint_attribute_groups[] = {
416
&cxl_decoder_base_attribute_group,
417
&cxl_decoder_endpoint_attribute_group,
418
&cxl_base_attribute_group,
419
NULL,
420
};
421
422
static void __cxl_decoder_release(struct cxl_decoder *cxld)
423
{
424
struct cxl_port *port = to_cxl_port(cxld->dev.parent);
425
426
ida_free(&port->decoder_ida, cxld->id);
427
put_device(&port->dev);
428
}
429
430
static void cxl_endpoint_decoder_release(struct device *dev)
431
{
432
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
433
434
__cxl_decoder_release(&cxled->cxld);
435
kfree(cxled);
436
}
437
438
static void cxl_switch_decoder_release(struct device *dev)
439
{
440
struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
441
442
__cxl_decoder_release(&cxlsd->cxld);
443
kfree(cxlsd);
444
}
445
446
struct cxl_root_decoder *to_cxl_root_decoder(struct device *dev)
447
{
448
if (dev_WARN_ONCE(dev, !is_root_decoder(dev),
449
"not a cxl_root_decoder device\n"))
450
return NULL;
451
return container_of(dev, struct cxl_root_decoder, cxlsd.cxld.dev);
452
}
453
EXPORT_SYMBOL_NS_GPL(to_cxl_root_decoder, "CXL");
454
455
static void cxl_root_decoder_release(struct device *dev)
456
{
457
struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
458
459
if (atomic_read(&cxlrd->region_id) >= 0)
460
memregion_free(atomic_read(&cxlrd->region_id));
461
__cxl_decoder_release(&cxlrd->cxlsd.cxld);
462
kfree(cxlrd->ops);
463
kfree(cxlrd);
464
}
465
466
static const struct device_type cxl_decoder_endpoint_type = {
467
.name = "cxl_decoder_endpoint",
468
.release = cxl_endpoint_decoder_release,
469
.groups = cxl_decoder_endpoint_attribute_groups,
470
};
471
472
static const struct device_type cxl_decoder_switch_type = {
473
.name = "cxl_decoder_switch",
474
.release = cxl_switch_decoder_release,
475
.groups = cxl_decoder_switch_attribute_groups,
476
};
477
478
static const struct device_type cxl_decoder_root_type = {
479
.name = "cxl_decoder_root",
480
.release = cxl_root_decoder_release,
481
.groups = cxl_decoder_root_attribute_groups,
482
};
483
484
bool is_endpoint_decoder(struct device *dev)
485
{
486
return dev->type == &cxl_decoder_endpoint_type;
487
}
488
EXPORT_SYMBOL_NS_GPL(is_endpoint_decoder, "CXL");
489
490
bool is_root_decoder(struct device *dev)
491
{
492
return dev->type == &cxl_decoder_root_type;
493
}
494
EXPORT_SYMBOL_NS_GPL(is_root_decoder, "CXL");
495
496
bool is_switch_decoder(struct device *dev)
497
{
498
return is_root_decoder(dev) || dev->type == &cxl_decoder_switch_type;
499
}
500
EXPORT_SYMBOL_NS_GPL(is_switch_decoder, "CXL");
501
502
struct cxl_decoder *to_cxl_decoder(struct device *dev)
503
{
504
if (dev_WARN_ONCE(dev,
505
!is_switch_decoder(dev) && !is_endpoint_decoder(dev),
506
"not a cxl_decoder device\n"))
507
return NULL;
508
return container_of(dev, struct cxl_decoder, dev);
509
}
510
EXPORT_SYMBOL_NS_GPL(to_cxl_decoder, "CXL");
511
512
struct cxl_endpoint_decoder *to_cxl_endpoint_decoder(struct device *dev)
513
{
514
if (dev_WARN_ONCE(dev, !is_endpoint_decoder(dev),
515
"not a cxl_endpoint_decoder device\n"))
516
return NULL;
517
return container_of(dev, struct cxl_endpoint_decoder, cxld.dev);
518
}
519
EXPORT_SYMBOL_NS_GPL(to_cxl_endpoint_decoder, "CXL");
520
521
struct cxl_switch_decoder *to_cxl_switch_decoder(struct device *dev)
522
{
523
if (dev_WARN_ONCE(dev, !is_switch_decoder(dev),
524
"not a cxl_switch_decoder device\n"))
525
return NULL;
526
return container_of(dev, struct cxl_switch_decoder, cxld.dev);
527
}
528
EXPORT_SYMBOL_NS_GPL(to_cxl_switch_decoder, "CXL");
529
530
static void cxl_ep_release(struct cxl_ep *ep)
531
{
532
put_device(ep->ep);
533
kfree(ep);
534
}
535
536
static void cxl_ep_remove(struct cxl_port *port, struct cxl_ep *ep)
537
{
538
if (!ep)
539
return;
540
xa_erase(&port->endpoints, (unsigned long) ep->ep);
541
cxl_ep_release(ep);
542
}
543
544
static void cxl_port_release(struct device *dev)
545
{
546
struct cxl_port *port = to_cxl_port(dev);
547
unsigned long index;
548
struct cxl_ep *ep;
549
550
xa_for_each(&port->endpoints, index, ep)
551
cxl_ep_remove(port, ep);
552
xa_destroy(&port->endpoints);
553
xa_destroy(&port->dports);
554
xa_destroy(&port->regions);
555
ida_free(&cxl_port_ida, port->id);
556
if (is_cxl_root(port))
557
kfree(to_cxl_root(port));
558
else
559
kfree(port);
560
}
561
562
static ssize_t decoders_committed_show(struct device *dev,
563
struct device_attribute *attr, char *buf)
564
{
565
struct cxl_port *port = to_cxl_port(dev);
566
567
guard(rwsem_read)(&cxl_rwsem.region);
568
return sysfs_emit(buf, "%d\n", cxl_num_decoders_committed(port));
569
}
570
571
static DEVICE_ATTR_RO(decoders_committed);
572
573
static struct attribute *cxl_port_attrs[] = {
574
&dev_attr_decoders_committed.attr,
575
NULL,
576
};
577
578
static struct attribute_group cxl_port_attribute_group = {
579
.attrs = cxl_port_attrs,
580
};
581
582
static const struct attribute_group *cxl_port_attribute_groups[] = {
583
&cxl_base_attribute_group,
584
&cxl_port_attribute_group,
585
NULL,
586
};
587
588
static const struct device_type cxl_port_type = {
589
.name = "cxl_port",
590
.release = cxl_port_release,
591
.groups = cxl_port_attribute_groups,
592
};
593
594
bool is_cxl_port(const struct device *dev)
595
{
596
return dev->type == &cxl_port_type;
597
}
598
EXPORT_SYMBOL_NS_GPL(is_cxl_port, "CXL");
599
600
struct cxl_port *to_cxl_port(const struct device *dev)
601
{
602
if (dev_WARN_ONCE(dev, dev->type != &cxl_port_type,
603
"not a cxl_port device\n"))
604
return NULL;
605
return container_of(dev, struct cxl_port, dev);
606
}
607
EXPORT_SYMBOL_NS_GPL(to_cxl_port, "CXL");
608
609
struct cxl_port *parent_port_of(struct cxl_port *port)
610
{
611
if (!port || !port->parent_dport)
612
return NULL;
613
return port->parent_dport->port;
614
}
615
616
static void unregister_port(void *_port)
617
{
618
struct cxl_port *port = _port;
619
struct cxl_port *parent = parent_port_of(port);
620
struct device *lock_dev;
621
622
/*
623
* CXL root port's and the first level of ports are unregistered
624
* under the platform firmware device lock, all other ports are
625
* unregistered while holding their parent port lock.
626
*/
627
if (!parent)
628
lock_dev = port->uport_dev;
629
else if (is_cxl_root(parent))
630
lock_dev = parent->uport_dev;
631
else
632
lock_dev = &parent->dev;
633
634
device_lock_assert(lock_dev);
635
port->dead = true;
636
device_unregister(&port->dev);
637
}
638
639
static void cxl_unlink_uport(void *_port)
640
{
641
struct cxl_port *port = _port;
642
643
sysfs_remove_link(&port->dev.kobj, "uport");
644
}
645
646
static int devm_cxl_link_uport(struct device *host, struct cxl_port *port)
647
{
648
int rc;
649
650
rc = sysfs_create_link(&port->dev.kobj, &port->uport_dev->kobj,
651
"uport");
652
if (rc)
653
return rc;
654
return devm_add_action_or_reset(host, cxl_unlink_uport, port);
655
}
656
657
static void cxl_unlink_parent_dport(void *_port)
658
{
659
struct cxl_port *port = _port;
660
661
sysfs_remove_link(&port->dev.kobj, "parent_dport");
662
}
663
664
static int devm_cxl_link_parent_dport(struct device *host,
665
struct cxl_port *port,
666
struct cxl_dport *parent_dport)
667
{
668
int rc;
669
670
if (!parent_dport)
671
return 0;
672
673
rc = sysfs_create_link(&port->dev.kobj, &parent_dport->dport_dev->kobj,
674
"parent_dport");
675
if (rc)
676
return rc;
677
return devm_add_action_or_reset(host, cxl_unlink_parent_dport, port);
678
}
679
680
static struct lock_class_key cxl_port_key;
681
682
static struct cxl_port *cxl_port_alloc(struct device *uport_dev,
683
struct cxl_dport *parent_dport)
684
{
685
struct cxl_root *cxl_root __free(kfree) = NULL;
686
struct cxl_port *port, *_port __free(kfree) = NULL;
687
struct device *dev;
688
int rc;
689
690
/* No parent_dport, root cxl_port */
691
if (!parent_dport) {
692
cxl_root = kzalloc(sizeof(*cxl_root), GFP_KERNEL);
693
if (!cxl_root)
694
return ERR_PTR(-ENOMEM);
695
} else {
696
_port = kzalloc(sizeof(*port), GFP_KERNEL);
697
if (!_port)
698
return ERR_PTR(-ENOMEM);
699
}
700
701
rc = ida_alloc(&cxl_port_ida, GFP_KERNEL);
702
if (rc < 0)
703
return ERR_PTR(rc);
704
705
if (cxl_root)
706
port = &no_free_ptr(cxl_root)->port;
707
else
708
port = no_free_ptr(_port);
709
710
port->id = rc;
711
port->uport_dev = uport_dev;
712
713
/*
714
* The top-level cxl_port "cxl_root" does not have a cxl_port as
715
* its parent and it does not have any corresponding component
716
* registers as its decode is described by a fixed platform
717
* description.
718
*/
719
dev = &port->dev;
720
if (parent_dport) {
721
struct cxl_port *parent_port = parent_dport->port;
722
struct cxl_port *iter;
723
724
dev->parent = &parent_port->dev;
725
port->depth = parent_port->depth + 1;
726
port->parent_dport = parent_dport;
727
728
/*
729
* walk to the host bridge, or the first ancestor that knows
730
* the host bridge
731
*/
732
iter = port;
733
while (!iter->host_bridge &&
734
!is_cxl_root(to_cxl_port(iter->dev.parent)))
735
iter = to_cxl_port(iter->dev.parent);
736
if (iter->host_bridge)
737
port->host_bridge = iter->host_bridge;
738
else if (parent_dport->rch)
739
port->host_bridge = parent_dport->dport_dev;
740
else
741
port->host_bridge = iter->uport_dev;
742
dev_dbg(uport_dev, "host-bridge: %s\n",
743
dev_name(port->host_bridge));
744
} else
745
dev->parent = uport_dev;
746
747
ida_init(&port->decoder_ida);
748
port->hdm_end = -1;
749
port->commit_end = -1;
750
xa_init(&port->dports);
751
xa_init(&port->endpoints);
752
xa_init(&port->regions);
753
port->component_reg_phys = CXL_RESOURCE_NONE;
754
755
device_initialize(dev);
756
lockdep_set_class_and_subclass(&dev->mutex, &cxl_port_key, port->depth);
757
device_set_pm_not_required(dev);
758
dev->bus = &cxl_bus_type;
759
dev->type = &cxl_port_type;
760
761
return port;
762
}
763
764
static int cxl_setup_comp_regs(struct device *host, struct cxl_register_map *map,
765
resource_size_t component_reg_phys)
766
{
767
*map = (struct cxl_register_map) {
768
.host = host,
769
.reg_type = CXL_REGLOC_RBI_EMPTY,
770
.resource = component_reg_phys,
771
};
772
773
if (component_reg_phys == CXL_RESOURCE_NONE)
774
return 0;
775
776
map->reg_type = CXL_REGLOC_RBI_COMPONENT;
777
map->max_size = CXL_COMPONENT_REG_BLOCK_SIZE;
778
779
return cxl_setup_regs(map);
780
}
781
782
static int cxl_port_setup_regs(struct cxl_port *port,
783
resource_size_t component_reg_phys)
784
{
785
if (dev_is_platform(port->uport_dev))
786
return 0;
787
return cxl_setup_comp_regs(&port->dev, &port->reg_map,
788
component_reg_phys);
789
}
790
791
static int cxl_dport_setup_regs(struct device *host, struct cxl_dport *dport,
792
resource_size_t component_reg_phys)
793
{
794
int rc;
795
796
if (dev_is_platform(dport->dport_dev))
797
return 0;
798
799
/*
800
* use @dport->dport_dev for the context for error messages during
801
* register probing, and fixup @host after the fact, since @host may be
802
* NULL.
803
*/
804
rc = cxl_setup_comp_regs(dport->dport_dev, &dport->reg_map,
805
component_reg_phys);
806
dport->reg_map.host = host;
807
return rc;
808
}
809
810
DEFINE_SHOW_ATTRIBUTE(einj_cxl_available_error_type);
811
812
static int cxl_einj_inject(void *data, u64 type)
813
{
814
struct cxl_dport *dport = data;
815
816
if (dport->rch)
817
return einj_cxl_inject_rch_error(dport->rcrb.base, type);
818
819
return einj_cxl_inject_error(to_pci_dev(dport->dport_dev), type);
820
}
821
DEFINE_DEBUGFS_ATTRIBUTE(cxl_einj_inject_fops, NULL, cxl_einj_inject,
822
"0x%llx\n");
823
824
static void cxl_debugfs_create_dport_dir(struct cxl_dport *dport)
825
{
826
struct dentry *dir;
827
828
if (!einj_cxl_is_initialized())
829
return;
830
831
/*
832
* dport_dev needs to be a PCIe port for CXL 2.0+ ports because
833
* EINJ expects a dport SBDF to be specified for 2.0 error injection.
834
*/
835
if (!dport->rch && !dev_is_pci(dport->dport_dev))
836
return;
837
838
dir = cxl_debugfs_create_dir(dev_name(dport->dport_dev));
839
840
debugfs_create_file("einj_inject", 0200, dir, dport,
841
&cxl_einj_inject_fops);
842
}
843
844
static int cxl_port_add(struct cxl_port *port,
845
resource_size_t component_reg_phys,
846
struct cxl_dport *parent_dport)
847
{
848
struct device *dev __free(put_device) = &port->dev;
849
int rc;
850
851
if (is_cxl_memdev(port->uport_dev)) {
852
struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
853
struct cxl_dev_state *cxlds = cxlmd->cxlds;
854
855
rc = dev_set_name(dev, "endpoint%d", port->id);
856
if (rc)
857
return rc;
858
859
/*
860
* The endpoint driver already enumerated the component and RAS
861
* registers. Reuse that enumeration while prepping them to be
862
* mapped by the cxl_port driver.
863
*/
864
port->reg_map = cxlds->reg_map;
865
port->reg_map.host = &port->dev;
866
cxlmd->endpoint = port;
867
} else if (parent_dport) {
868
rc = dev_set_name(dev, "port%d", port->id);
869
if (rc)
870
return rc;
871
872
port->component_reg_phys = component_reg_phys;
873
} else {
874
rc = dev_set_name(dev, "root%d", port->id);
875
if (rc)
876
return rc;
877
}
878
879
rc = device_add(dev);
880
if (rc)
881
return rc;
882
883
/* Inhibit the cleanup function invoked */
884
dev = NULL;
885
return 0;
886
}
887
888
static struct cxl_port *__devm_cxl_add_port(struct device *host,
889
struct device *uport_dev,
890
resource_size_t component_reg_phys,
891
struct cxl_dport *parent_dport)
892
{
893
struct cxl_port *port;
894
int rc;
895
896
port = cxl_port_alloc(uport_dev, parent_dport);
897
if (IS_ERR(port))
898
return port;
899
900
rc = cxl_port_add(port, component_reg_phys, parent_dport);
901
if (rc)
902
return ERR_PTR(rc);
903
904
rc = devm_add_action_or_reset(host, unregister_port, port);
905
if (rc)
906
return ERR_PTR(rc);
907
908
rc = devm_cxl_link_uport(host, port);
909
if (rc)
910
return ERR_PTR(rc);
911
912
rc = devm_cxl_link_parent_dport(host, port, parent_dport);
913
if (rc)
914
return ERR_PTR(rc);
915
916
if (parent_dport && dev_is_pci(uport_dev))
917
port->pci_latency = cxl_pci_get_latency(to_pci_dev(uport_dev));
918
919
return port;
920
}
921
922
/**
923
* devm_cxl_add_port - register a cxl_port in CXL memory decode hierarchy
924
* @host: host device for devm operations
925
* @uport_dev: "physical" device implementing this upstream port
926
* @component_reg_phys: (optional) for configurable cxl_port instances
927
* @parent_dport: next hop up in the CXL memory decode hierarchy
928
*/
929
struct cxl_port *devm_cxl_add_port(struct device *host,
930
struct device *uport_dev,
931
resource_size_t component_reg_phys,
932
struct cxl_dport *parent_dport)
933
{
934
struct cxl_port *port, *parent_port;
935
936
port = __devm_cxl_add_port(host, uport_dev, component_reg_phys,
937
parent_dport);
938
939
parent_port = parent_dport ? parent_dport->port : NULL;
940
if (IS_ERR(port)) {
941
dev_dbg(uport_dev, "Failed to add%s%s%s: %ld\n",
942
parent_port ? " port to " : "",
943
parent_port ? dev_name(&parent_port->dev) : "",
944
parent_port ? "" : " root port",
945
PTR_ERR(port));
946
} else {
947
dev_dbg(uport_dev, "%s added%s%s%s\n",
948
dev_name(&port->dev),
949
parent_port ? " to " : "",
950
parent_port ? dev_name(&parent_port->dev) : "",
951
parent_port ? "" : " (root port)");
952
}
953
954
return port;
955
}
956
EXPORT_SYMBOL_NS_GPL(devm_cxl_add_port, "CXL");
957
958
struct cxl_root *devm_cxl_add_root(struct device *host,
959
const struct cxl_root_ops *ops)
960
{
961
struct cxl_root *cxl_root;
962
struct cxl_port *port;
963
964
port = devm_cxl_add_port(host, host, CXL_RESOURCE_NONE, NULL);
965
if (IS_ERR(port))
966
return ERR_CAST(port);
967
968
cxl_root = to_cxl_root(port);
969
cxl_root->ops = ops;
970
return cxl_root;
971
}
972
EXPORT_SYMBOL_NS_GPL(devm_cxl_add_root, "CXL");
973
974
struct pci_bus *cxl_port_to_pci_bus(struct cxl_port *port)
975
{
976
/* There is no pci_bus associated with a CXL platform-root port */
977
if (is_cxl_root(port))
978
return NULL;
979
980
if (dev_is_pci(port->uport_dev)) {
981
struct pci_dev *pdev = to_pci_dev(port->uport_dev);
982
983
return pdev->subordinate;
984
}
985
986
return xa_load(&cxl_root_buses, (unsigned long)port->uport_dev);
987
}
988
EXPORT_SYMBOL_NS_GPL(cxl_port_to_pci_bus, "CXL");
989
990
static void unregister_pci_bus(void *uport_dev)
991
{
992
xa_erase(&cxl_root_buses, (unsigned long)uport_dev);
993
}
994
995
int devm_cxl_register_pci_bus(struct device *host, struct device *uport_dev,
996
struct pci_bus *bus)
997
{
998
int rc;
999
1000
if (dev_is_pci(uport_dev))
1001
return -EINVAL;
1002
1003
rc = xa_insert(&cxl_root_buses, (unsigned long)uport_dev, bus,
1004
GFP_KERNEL);
1005
if (rc)
1006
return rc;
1007
return devm_add_action_or_reset(host, unregister_pci_bus, uport_dev);
1008
}
1009
EXPORT_SYMBOL_NS_GPL(devm_cxl_register_pci_bus, "CXL");
1010
1011
static bool dev_is_cxl_root_child(struct device *dev)
1012
{
1013
struct cxl_port *port, *parent;
1014
1015
if (!is_cxl_port(dev))
1016
return false;
1017
1018
port = to_cxl_port(dev);
1019
if (is_cxl_root(port))
1020
return false;
1021
1022
parent = to_cxl_port(port->dev.parent);
1023
if (is_cxl_root(parent))
1024
return true;
1025
1026
return false;
1027
}
1028
1029
struct cxl_root *find_cxl_root(struct cxl_port *port)
1030
{
1031
struct cxl_port *iter = port;
1032
1033
while (iter && !is_cxl_root(iter))
1034
iter = to_cxl_port(iter->dev.parent);
1035
1036
if (!iter)
1037
return NULL;
1038
get_device(&iter->dev);
1039
return to_cxl_root(iter);
1040
}
1041
EXPORT_SYMBOL_NS_GPL(find_cxl_root, "CXL");
1042
1043
static struct cxl_dport *find_dport(struct cxl_port *port, int id)
1044
{
1045
struct cxl_dport *dport;
1046
unsigned long index;
1047
1048
device_lock_assert(&port->dev);
1049
xa_for_each(&port->dports, index, dport)
1050
if (dport->port_id == id)
1051
return dport;
1052
return NULL;
1053
}
1054
1055
static int add_dport(struct cxl_port *port, struct cxl_dport *dport)
1056
{
1057
struct cxl_dport *dup;
1058
int rc;
1059
1060
device_lock_assert(&port->dev);
1061
dup = find_dport(port, dport->port_id);
1062
if (dup) {
1063
dev_err(&port->dev,
1064
"unable to add dport%d-%s non-unique port id (%s)\n",
1065
dport->port_id, dev_name(dport->dport_dev),
1066
dev_name(dup->dport_dev));
1067
return -EBUSY;
1068
}
1069
1070
rc = xa_insert(&port->dports, (unsigned long)dport->dport_dev, dport,
1071
GFP_KERNEL);
1072
if (rc)
1073
return rc;
1074
1075
port->nr_dports++;
1076
return 0;
1077
}
1078
1079
/*
1080
* Since root-level CXL dports cannot be enumerated by PCI they are not
1081
* enumerated by the common port driver that acquires the port lock over
1082
* dport add/remove. Instead, root dports are manually added by a
1083
* platform driver and cond_cxl_root_lock() is used to take the missing
1084
* port lock in that case.
1085
*/
1086
static void cond_cxl_root_lock(struct cxl_port *port)
1087
{
1088
if (is_cxl_root(port))
1089
device_lock(&port->dev);
1090
}
1091
1092
static void cond_cxl_root_unlock(struct cxl_port *port)
1093
{
1094
if (is_cxl_root(port))
1095
device_unlock(&port->dev);
1096
}
1097
1098
static void cxl_dport_remove(void *data)
1099
{
1100
struct cxl_dport *dport = data;
1101
struct cxl_port *port = dport->port;
1102
1103
xa_erase(&port->dports, (unsigned long) dport->dport_dev);
1104
put_device(dport->dport_dev);
1105
}
1106
1107
static void cxl_dport_unlink(void *data)
1108
{
1109
struct cxl_dport *dport = data;
1110
struct cxl_port *port = dport->port;
1111
char link_name[CXL_TARGET_STRLEN];
1112
1113
sprintf(link_name, "dport%d", dport->port_id);
1114
sysfs_remove_link(&port->dev.kobj, link_name);
1115
}
1116
1117
static struct cxl_dport *
1118
__devm_cxl_add_dport(struct cxl_port *port, struct device *dport_dev,
1119
int port_id, resource_size_t component_reg_phys,
1120
resource_size_t rcrb)
1121
{
1122
char link_name[CXL_TARGET_STRLEN];
1123
struct cxl_dport *dport;
1124
struct device *host;
1125
int rc;
1126
1127
if (is_cxl_root(port))
1128
host = port->uport_dev;
1129
else
1130
host = &port->dev;
1131
1132
if (!host->driver) {
1133
dev_WARN_ONCE(&port->dev, 1, "dport:%s bad devm context\n",
1134
dev_name(dport_dev));
1135
return ERR_PTR(-ENXIO);
1136
}
1137
1138
if (snprintf(link_name, CXL_TARGET_STRLEN, "dport%d", port_id) >=
1139
CXL_TARGET_STRLEN)
1140
return ERR_PTR(-EINVAL);
1141
1142
dport = devm_kzalloc(host, sizeof(*dport), GFP_KERNEL);
1143
if (!dport)
1144
return ERR_PTR(-ENOMEM);
1145
1146
dport->dport_dev = dport_dev;
1147
dport->port_id = port_id;
1148
dport->port = port;
1149
1150
if (rcrb == CXL_RESOURCE_NONE) {
1151
rc = cxl_dport_setup_regs(&port->dev, dport,
1152
component_reg_phys);
1153
if (rc)
1154
return ERR_PTR(rc);
1155
} else {
1156
dport->rcrb.base = rcrb;
1157
component_reg_phys = __rcrb_to_component(dport_dev, &dport->rcrb,
1158
CXL_RCRB_DOWNSTREAM);
1159
if (component_reg_phys == CXL_RESOURCE_NONE) {
1160
dev_warn(dport_dev, "Invalid Component Registers in RCRB");
1161
return ERR_PTR(-ENXIO);
1162
}
1163
1164
/*
1165
* RCH @dport is not ready to map until associated with its
1166
* memdev
1167
*/
1168
rc = cxl_dport_setup_regs(NULL, dport, component_reg_phys);
1169
if (rc)
1170
return ERR_PTR(rc);
1171
1172
dport->rch = true;
1173
}
1174
1175
if (component_reg_phys != CXL_RESOURCE_NONE)
1176
dev_dbg(dport_dev, "Component Registers found for dport: %pa\n",
1177
&component_reg_phys);
1178
1179
cond_cxl_root_lock(port);
1180
rc = add_dport(port, dport);
1181
cond_cxl_root_unlock(port);
1182
if (rc)
1183
return ERR_PTR(rc);
1184
1185
get_device(dport_dev);
1186
rc = devm_add_action_or_reset(host, cxl_dport_remove, dport);
1187
if (rc)
1188
return ERR_PTR(rc);
1189
1190
rc = sysfs_create_link(&port->dev.kobj, &dport_dev->kobj, link_name);
1191
if (rc)
1192
return ERR_PTR(rc);
1193
1194
rc = devm_add_action_or_reset(host, cxl_dport_unlink, dport);
1195
if (rc)
1196
return ERR_PTR(rc);
1197
1198
if (dev_is_pci(dport_dev))
1199
dport->link_latency = cxl_pci_get_latency(to_pci_dev(dport_dev));
1200
1201
cxl_debugfs_create_dport_dir(dport);
1202
1203
/*
1204
* Setup port register if this is the first dport showed up. Having
1205
* a dport also means that there is at least 1 active link.
1206
*/
1207
if (port->nr_dports == 1 &&
1208
port->component_reg_phys != CXL_RESOURCE_NONE) {
1209
rc = cxl_port_setup_regs(port, port->component_reg_phys);
1210
if (rc)
1211
return ERR_PTR(rc);
1212
port->component_reg_phys = CXL_RESOURCE_NONE;
1213
}
1214
1215
return dport;
1216
}
1217
1218
/**
1219
* devm_cxl_add_dport - append VH downstream port data to a cxl_port
1220
* @port: the cxl_port that references this dport
1221
* @dport_dev: firmware or PCI device representing the dport
1222
* @port_id: identifier for this dport in a decoder's target list
1223
* @component_reg_phys: optional location of CXL component registers
1224
*
1225
* Note that dports are appended to the devm release action's of the
1226
* either the port's host (for root ports), or the port itself (for
1227
* switch ports)
1228
*/
1229
struct cxl_dport *devm_cxl_add_dport(struct cxl_port *port,
1230
struct device *dport_dev, int port_id,
1231
resource_size_t component_reg_phys)
1232
{
1233
struct cxl_dport *dport;
1234
1235
dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1236
component_reg_phys, CXL_RESOURCE_NONE);
1237
if (IS_ERR(dport)) {
1238
dev_dbg(dport_dev, "failed to add dport to %s: %ld\n",
1239
dev_name(&port->dev), PTR_ERR(dport));
1240
} else {
1241
dev_dbg(dport_dev, "dport added to %s\n",
1242
dev_name(&port->dev));
1243
}
1244
1245
return dport;
1246
}
1247
EXPORT_SYMBOL_NS_GPL(devm_cxl_add_dport, "CXL");
1248
1249
/**
1250
* devm_cxl_add_rch_dport - append RCH downstream port data to a cxl_port
1251
* @port: the cxl_port that references this dport
1252
* @dport_dev: firmware or PCI device representing the dport
1253
* @port_id: identifier for this dport in a decoder's target list
1254
* @rcrb: mandatory location of a Root Complex Register Block
1255
*
1256
* See CXL 3.0 9.11.8 CXL Devices Attached to an RCH
1257
*/
1258
struct cxl_dport *devm_cxl_add_rch_dport(struct cxl_port *port,
1259
struct device *dport_dev, int port_id,
1260
resource_size_t rcrb)
1261
{
1262
struct cxl_dport *dport;
1263
1264
if (rcrb == CXL_RESOURCE_NONE) {
1265
dev_dbg(&port->dev, "failed to add RCH dport, missing RCRB\n");
1266
return ERR_PTR(-EINVAL);
1267
}
1268
1269
dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1270
CXL_RESOURCE_NONE, rcrb);
1271
if (IS_ERR(dport)) {
1272
dev_dbg(dport_dev, "failed to add RCH dport to %s: %ld\n",
1273
dev_name(&port->dev), PTR_ERR(dport));
1274
} else {
1275
dev_dbg(dport_dev, "RCH dport added to %s\n",
1276
dev_name(&port->dev));
1277
}
1278
1279
return dport;
1280
}
1281
EXPORT_SYMBOL_NS_GPL(devm_cxl_add_rch_dport, "CXL");
1282
1283
static int add_ep(struct cxl_ep *new)
1284
{
1285
struct cxl_port *port = new->dport->port;
1286
1287
guard(device)(&port->dev);
1288
if (port->dead)
1289
return -ENXIO;
1290
1291
return xa_insert(&port->endpoints, (unsigned long)new->ep,
1292
new, GFP_KERNEL);
1293
}
1294
1295
/**
1296
* cxl_add_ep - register an endpoint's interest in a port
1297
* @dport: the dport that routes to @ep_dev
1298
* @ep_dev: device representing the endpoint
1299
*
1300
* Intermediate CXL ports are scanned based on the arrival of endpoints.
1301
* When those endpoints depart the port can be destroyed once all
1302
* endpoints that care about that port have been removed.
1303
*/
1304
static int cxl_add_ep(struct cxl_dport *dport, struct device *ep_dev)
1305
{
1306
struct cxl_ep *ep;
1307
int rc;
1308
1309
ep = kzalloc(sizeof(*ep), GFP_KERNEL);
1310
if (!ep)
1311
return -ENOMEM;
1312
1313
ep->ep = get_device(ep_dev);
1314
ep->dport = dport;
1315
1316
rc = add_ep(ep);
1317
if (rc)
1318
cxl_ep_release(ep);
1319
return rc;
1320
}
1321
1322
struct cxl_find_port_ctx {
1323
const struct device *dport_dev;
1324
const struct cxl_port *parent_port;
1325
struct cxl_dport **dport;
1326
};
1327
1328
static int match_port_by_dport(struct device *dev, const void *data)
1329
{
1330
const struct cxl_find_port_ctx *ctx = data;
1331
struct cxl_dport *dport;
1332
struct cxl_port *port;
1333
1334
if (!is_cxl_port(dev))
1335
return 0;
1336
if (ctx->parent_port && dev->parent != &ctx->parent_port->dev)
1337
return 0;
1338
1339
port = to_cxl_port(dev);
1340
dport = cxl_find_dport_by_dev(port, ctx->dport_dev);
1341
if (ctx->dport)
1342
*ctx->dport = dport;
1343
return dport != NULL;
1344
}
1345
1346
static struct cxl_port *__find_cxl_port(struct cxl_find_port_ctx *ctx)
1347
{
1348
struct device *dev;
1349
1350
if (!ctx->dport_dev)
1351
return NULL;
1352
1353
dev = bus_find_device(&cxl_bus_type, NULL, ctx, match_port_by_dport);
1354
if (dev)
1355
return to_cxl_port(dev);
1356
return NULL;
1357
}
1358
1359
static struct cxl_port *find_cxl_port(struct device *dport_dev,
1360
struct cxl_dport **dport)
1361
{
1362
struct cxl_find_port_ctx ctx = {
1363
.dport_dev = dport_dev,
1364
.dport = dport,
1365
};
1366
struct cxl_port *port;
1367
1368
port = __find_cxl_port(&ctx);
1369
return port;
1370
}
1371
1372
/*
1373
* All users of grandparent() are using it to walk PCIe-like switch port
1374
* hierarchy. A PCIe switch is comprised of a bridge device representing the
1375
* upstream switch port and N bridges representing downstream switch ports. When
1376
* bridges stack the grand-parent of a downstream switch port is another
1377
* downstream switch port in the immediate ancestor switch.
1378
*/
1379
static struct device *grandparent(struct device *dev)
1380
{
1381
if (dev && dev->parent)
1382
return dev->parent->parent;
1383
return NULL;
1384
}
1385
1386
static struct device *endpoint_host(struct cxl_port *endpoint)
1387
{
1388
struct cxl_port *port = to_cxl_port(endpoint->dev.parent);
1389
1390
if (is_cxl_root(port))
1391
return port->uport_dev;
1392
return &port->dev;
1393
}
1394
1395
static void delete_endpoint(void *data)
1396
{
1397
struct cxl_memdev *cxlmd = data;
1398
struct cxl_port *endpoint = cxlmd->endpoint;
1399
struct device *host = endpoint_host(endpoint);
1400
1401
scoped_guard(device, host) {
1402
if (host->driver && !endpoint->dead) {
1403
devm_release_action(host, cxl_unlink_parent_dport, endpoint);
1404
devm_release_action(host, cxl_unlink_uport, endpoint);
1405
devm_release_action(host, unregister_port, endpoint);
1406
}
1407
cxlmd->endpoint = NULL;
1408
}
1409
put_device(&endpoint->dev);
1410
put_device(host);
1411
}
1412
1413
int cxl_endpoint_autoremove(struct cxl_memdev *cxlmd, struct cxl_port *endpoint)
1414
{
1415
struct device *host = endpoint_host(endpoint);
1416
struct device *dev = &cxlmd->dev;
1417
1418
get_device(host);
1419
get_device(&endpoint->dev);
1420
cxlmd->depth = endpoint->depth;
1421
return devm_add_action_or_reset(dev, delete_endpoint, cxlmd);
1422
}
1423
EXPORT_SYMBOL_NS_GPL(cxl_endpoint_autoremove, "CXL");
1424
1425
/*
1426
* The natural end of life of a non-root 'cxl_port' is when its parent port goes
1427
* through a ->remove() event ("top-down" unregistration). The unnatural trigger
1428
* for a port to be unregistered is when all memdevs beneath that port have gone
1429
* through ->remove(). This "bottom-up" removal selectively removes individual
1430
* child ports manually. This depends on devm_cxl_add_port() to not change is
1431
* devm action registration order, and for dports to have already been
1432
* destroyed by del_dports().
1433
*/
1434
static void delete_switch_port(struct cxl_port *port)
1435
{
1436
devm_release_action(port->dev.parent, cxl_unlink_parent_dport, port);
1437
devm_release_action(port->dev.parent, cxl_unlink_uport, port);
1438
devm_release_action(port->dev.parent, unregister_port, port);
1439
}
1440
1441
static void del_dport(struct cxl_dport *dport)
1442
{
1443
struct cxl_port *port = dport->port;
1444
1445
devm_release_action(&port->dev, cxl_dport_unlink, dport);
1446
devm_release_action(&port->dev, cxl_dport_remove, dport);
1447
devm_kfree(&port->dev, dport);
1448
}
1449
1450
static void del_dports(struct cxl_port *port)
1451
{
1452
struct cxl_dport *dport;
1453
unsigned long index;
1454
1455
device_lock_assert(&port->dev);
1456
1457
xa_for_each(&port->dports, index, dport)
1458
del_dport(dport);
1459
}
1460
1461
struct detach_ctx {
1462
struct cxl_memdev *cxlmd;
1463
int depth;
1464
};
1465
1466
static int port_has_memdev(struct device *dev, const void *data)
1467
{
1468
const struct detach_ctx *ctx = data;
1469
struct cxl_port *port;
1470
1471
if (!is_cxl_port(dev))
1472
return 0;
1473
1474
port = to_cxl_port(dev);
1475
if (port->depth != ctx->depth)
1476
return 0;
1477
1478
return !!cxl_ep_load(port, ctx->cxlmd);
1479
}
1480
1481
static void cxl_detach_ep(void *data)
1482
{
1483
struct cxl_memdev *cxlmd = data;
1484
1485
for (int i = cxlmd->depth - 1; i >= 1; i--) {
1486
struct cxl_port *port, *parent_port;
1487
struct detach_ctx ctx = {
1488
.cxlmd = cxlmd,
1489
.depth = i,
1490
};
1491
struct cxl_ep *ep;
1492
bool died = false;
1493
1494
struct device *dev __free(put_device) =
1495
bus_find_device(&cxl_bus_type, NULL, &ctx, port_has_memdev);
1496
if (!dev)
1497
continue;
1498
port = to_cxl_port(dev);
1499
1500
parent_port = to_cxl_port(port->dev.parent);
1501
device_lock(&parent_port->dev);
1502
device_lock(&port->dev);
1503
ep = cxl_ep_load(port, cxlmd);
1504
dev_dbg(&cxlmd->dev, "disconnect %s from %s\n",
1505
ep ? dev_name(ep->ep) : "", dev_name(&port->dev));
1506
cxl_ep_remove(port, ep);
1507
if (ep && !port->dead && xa_empty(&port->endpoints) &&
1508
!is_cxl_root(parent_port) && parent_port->dev.driver) {
1509
/*
1510
* This was the last ep attached to a dynamically
1511
* enumerated port. Block new cxl_add_ep() and garbage
1512
* collect the port.
1513
*/
1514
died = true;
1515
port->dead = true;
1516
del_dports(port);
1517
}
1518
device_unlock(&port->dev);
1519
1520
if (died) {
1521
dev_dbg(&cxlmd->dev, "delete %s\n",
1522
dev_name(&port->dev));
1523
delete_switch_port(port);
1524
}
1525
device_unlock(&parent_port->dev);
1526
}
1527
}
1528
1529
static resource_size_t find_component_registers(struct device *dev)
1530
{
1531
struct cxl_register_map map;
1532
struct pci_dev *pdev;
1533
1534
/*
1535
* Theoretically, CXL component registers can be hosted on a
1536
* non-PCI device, in practice, only cxl_test hits this case.
1537
*/
1538
if (!dev_is_pci(dev))
1539
return CXL_RESOURCE_NONE;
1540
1541
pdev = to_pci_dev(dev);
1542
1543
cxl_find_regblock(pdev, CXL_REGLOC_RBI_COMPONENT, &map);
1544
return map.resource;
1545
}
1546
1547
static int match_port_by_uport(struct device *dev, const void *data)
1548
{
1549
const struct device *uport_dev = data;
1550
struct cxl_port *port;
1551
1552
if (!is_cxl_port(dev))
1553
return 0;
1554
1555
port = to_cxl_port(dev);
1556
return uport_dev == port->uport_dev;
1557
}
1558
1559
/*
1560
* Function takes a device reference on the port device. Caller should do a
1561
* put_device() when done.
1562
*/
1563
static struct cxl_port *find_cxl_port_by_uport(struct device *uport_dev)
1564
{
1565
struct device *dev;
1566
1567
dev = bus_find_device(&cxl_bus_type, NULL, uport_dev, match_port_by_uport);
1568
if (dev)
1569
return to_cxl_port(dev);
1570
return NULL;
1571
}
1572
1573
static int update_decoder_targets(struct device *dev, void *data)
1574
{
1575
struct cxl_dport *dport = data;
1576
struct cxl_switch_decoder *cxlsd;
1577
struct cxl_decoder *cxld;
1578
int i;
1579
1580
if (!is_switch_decoder(dev))
1581
return 0;
1582
1583
cxlsd = to_cxl_switch_decoder(dev);
1584
cxld = &cxlsd->cxld;
1585
guard(rwsem_write)(&cxl_rwsem.region);
1586
1587
for (i = 0; i < cxld->interleave_ways; i++) {
1588
if (cxld->target_map[i] == dport->port_id) {
1589
cxlsd->target[i] = dport;
1590
dev_dbg(dev, "dport%d found in target list, index %d\n",
1591
dport->port_id, i);
1592
return 1;
1593
}
1594
}
1595
1596
return 0;
1597
}
1598
1599
DEFINE_FREE(del_cxl_dport, struct cxl_dport *, if (!IS_ERR_OR_NULL(_T)) del_dport(_T))
1600
static struct cxl_dport *cxl_port_add_dport(struct cxl_port *port,
1601
struct device *dport_dev)
1602
{
1603
struct cxl_dport *dport;
1604
int rc;
1605
1606
device_lock_assert(&port->dev);
1607
if (!port->dev.driver)
1608
return ERR_PTR(-ENXIO);
1609
1610
dport = cxl_find_dport_by_dev(port, dport_dev);
1611
if (dport) {
1612
dev_dbg(&port->dev, "dport%d:%s already exists\n",
1613
dport->port_id, dev_name(dport_dev));
1614
return ERR_PTR(-EBUSY);
1615
}
1616
1617
struct cxl_dport *new_dport __free(del_cxl_dport) =
1618
devm_cxl_add_dport_by_dev(port, dport_dev);
1619
if (IS_ERR(new_dport))
1620
return new_dport;
1621
1622
cxl_switch_parse_cdat(new_dport);
1623
1624
if (ida_is_empty(&port->decoder_ida)) {
1625
rc = devm_cxl_switch_port_decoders_setup(port);
1626
if (rc)
1627
return ERR_PTR(rc);
1628
dev_dbg(&port->dev, "first dport%d:%s added with decoders\n",
1629
new_dport->port_id, dev_name(dport_dev));
1630
return no_free_ptr(new_dport);
1631
}
1632
1633
/* New dport added, update the decoder targets */
1634
device_for_each_child(&port->dev, new_dport, update_decoder_targets);
1635
1636
dev_dbg(&port->dev, "dport%d:%s added\n", new_dport->port_id,
1637
dev_name(dport_dev));
1638
1639
return no_free_ptr(new_dport);
1640
}
1641
1642
static struct cxl_dport *devm_cxl_create_port(struct device *ep_dev,
1643
struct cxl_port *parent_port,
1644
struct cxl_dport *parent_dport,
1645
struct device *uport_dev,
1646
struct device *dport_dev)
1647
{
1648
resource_size_t component_reg_phys;
1649
1650
device_lock_assert(&parent_port->dev);
1651
if (!parent_port->dev.driver) {
1652
dev_warn(ep_dev,
1653
"port %s:%s:%s disabled, failed to enumerate CXL.mem\n",
1654
dev_name(&parent_port->dev), dev_name(uport_dev),
1655
dev_name(dport_dev));
1656
}
1657
1658
struct cxl_port *port __free(put_cxl_port) =
1659
find_cxl_port_by_uport(uport_dev);
1660
if (!port) {
1661
component_reg_phys = find_component_registers(uport_dev);
1662
port = devm_cxl_add_port(&parent_port->dev, uport_dev,
1663
component_reg_phys, parent_dport);
1664
if (IS_ERR(port))
1665
return ERR_CAST(port);
1666
1667
/*
1668
* retry to make sure a port is found. a port device
1669
* reference is taken.
1670
*/
1671
port = find_cxl_port_by_uport(uport_dev);
1672
if (!port)
1673
return ERR_PTR(-ENODEV);
1674
1675
dev_dbg(ep_dev, "created port %s:%s\n",
1676
dev_name(&port->dev), dev_name(port->uport_dev));
1677
} else {
1678
/*
1679
* Port was created before right before this function is
1680
* called. Signal the caller to deal with it.
1681
*/
1682
return ERR_PTR(-EAGAIN);
1683
}
1684
1685
guard(device)(&port->dev);
1686
return cxl_port_add_dport(port, dport_dev);
1687
}
1688
1689
static int add_port_attach_ep(struct cxl_memdev *cxlmd,
1690
struct device *uport_dev,
1691
struct device *dport_dev)
1692
{
1693
struct device *dparent = grandparent(dport_dev);
1694
struct cxl_dport *dport, *parent_dport;
1695
int rc;
1696
1697
if (is_cxl_host_bridge(dparent)) {
1698
/*
1699
* The iteration reached the topology root without finding the
1700
* CXL-root 'cxl_port' on a previous iteration, fail for now to
1701
* be re-probed after platform driver attaches.
1702
*/
1703
dev_dbg(&cxlmd->dev, "%s is a root dport\n",
1704
dev_name(dport_dev));
1705
return -ENXIO;
1706
}
1707
1708
struct cxl_port *parent_port __free(put_cxl_port) =
1709
find_cxl_port_by_uport(dparent->parent);
1710
if (!parent_port) {
1711
/* iterate to create this parent_port */
1712
return -EAGAIN;
1713
}
1714
1715
scoped_guard(device, &parent_port->dev) {
1716
parent_dport = cxl_find_dport_by_dev(parent_port, dparent);
1717
if (!parent_dport) {
1718
parent_dport = cxl_port_add_dport(parent_port, dparent);
1719
if (IS_ERR(parent_dport))
1720
return PTR_ERR(parent_dport);
1721
}
1722
1723
dport = devm_cxl_create_port(&cxlmd->dev, parent_port,
1724
parent_dport, uport_dev,
1725
dport_dev);
1726
if (IS_ERR(dport)) {
1727
/* Port already exists, restart iteration */
1728
if (PTR_ERR(dport) == -EAGAIN)
1729
return 0;
1730
return PTR_ERR(dport);
1731
}
1732
}
1733
1734
rc = cxl_add_ep(dport, &cxlmd->dev);
1735
if (rc == -EBUSY) {
1736
/*
1737
* "can't" happen, but this error code means
1738
* something to the caller, so translate it.
1739
*/
1740
rc = -ENXIO;
1741
}
1742
1743
return rc;
1744
}
1745
1746
static struct cxl_dport *find_or_add_dport(struct cxl_port *port,
1747
struct device *dport_dev)
1748
{
1749
struct cxl_dport *dport;
1750
1751
device_lock_assert(&port->dev);
1752
dport = cxl_find_dport_by_dev(port, dport_dev);
1753
if (!dport) {
1754
dport = cxl_port_add_dport(port, dport_dev);
1755
if (IS_ERR(dport))
1756
return dport;
1757
1758
/* New dport added, restart iteration */
1759
return ERR_PTR(-EAGAIN);
1760
}
1761
1762
return dport;
1763
}
1764
1765
int devm_cxl_enumerate_ports(struct cxl_memdev *cxlmd)
1766
{
1767
struct device *dev = &cxlmd->dev;
1768
struct device *iter;
1769
int rc;
1770
1771
/*
1772
* Skip intermediate port enumeration in the RCH case, there
1773
* are no ports in between a host bridge and an endpoint.
1774
*/
1775
if (cxlmd->cxlds->rcd)
1776
return 0;
1777
1778
rc = devm_add_action_or_reset(&cxlmd->dev, cxl_detach_ep, cxlmd);
1779
if (rc)
1780
return rc;
1781
1782
/*
1783
* Scan for and add all cxl_ports in this device's ancestry.
1784
* Repeat until no more ports are added. Abort if a port add
1785
* attempt fails.
1786
*/
1787
retry:
1788
for (iter = dev; iter; iter = grandparent(iter)) {
1789
struct device *dport_dev = grandparent(iter);
1790
struct device *uport_dev;
1791
struct cxl_dport *dport;
1792
1793
if (is_cxl_host_bridge(dport_dev))
1794
return 0;
1795
1796
uport_dev = dport_dev->parent;
1797
if (!uport_dev) {
1798
dev_warn(dev, "at %s no parent for dport: %s\n",
1799
dev_name(iter), dev_name(dport_dev));
1800
return -ENXIO;
1801
}
1802
1803
dev_dbg(dev, "scan: iter: %s dport_dev: %s parent: %s\n",
1804
dev_name(iter), dev_name(dport_dev),
1805
dev_name(uport_dev));
1806
struct cxl_port *port __free(put_cxl_port) =
1807
find_cxl_port_by_uport(uport_dev);
1808
if (port) {
1809
dev_dbg(&cxlmd->dev,
1810
"found already registered port %s:%s\n",
1811
dev_name(&port->dev),
1812
dev_name(port->uport_dev));
1813
1814
/*
1815
* RP port enumerated by cxl_acpi without dport will
1816
* have the dport added here.
1817
*/
1818
scoped_guard(device, &port->dev) {
1819
dport = find_or_add_dport(port, dport_dev);
1820
if (IS_ERR(dport)) {
1821
if (PTR_ERR(dport) == -EAGAIN)
1822
goto retry;
1823
return PTR_ERR(dport);
1824
}
1825
}
1826
1827
rc = cxl_add_ep(dport, &cxlmd->dev);
1828
1829
/*
1830
* If the endpoint already exists in the port's list,
1831
* that's ok, it was added on a previous pass.
1832
* Otherwise, retry in add_port_attach_ep() after taking
1833
* the parent_port lock as the current port may be being
1834
* reaped.
1835
*/
1836
if (rc && rc != -EBUSY)
1837
return rc;
1838
1839
cxl_gpf_port_setup(dport);
1840
1841
/* Any more ports to add between this one and the root? */
1842
if (!dev_is_cxl_root_child(&port->dev))
1843
continue;
1844
1845
return 0;
1846
}
1847
1848
rc = add_port_attach_ep(cxlmd, uport_dev, dport_dev);
1849
/* port missing, try to add parent */
1850
if (rc == -EAGAIN)
1851
continue;
1852
/* failed to add ep or port */
1853
if (rc)
1854
return rc;
1855
/* port added, new descendants possible, start over */
1856
goto retry;
1857
}
1858
1859
return 0;
1860
}
1861
EXPORT_SYMBOL_NS_GPL(devm_cxl_enumerate_ports, "CXL");
1862
1863
struct cxl_port *cxl_pci_find_port(struct pci_dev *pdev,
1864
struct cxl_dport **dport)
1865
{
1866
return find_cxl_port(pdev->dev.parent, dport);
1867
}
1868
EXPORT_SYMBOL_NS_GPL(cxl_pci_find_port, "CXL");
1869
1870
struct cxl_port *cxl_mem_find_port(struct cxl_memdev *cxlmd,
1871
struct cxl_dport **dport)
1872
{
1873
return find_cxl_port(grandparent(&cxlmd->dev), dport);
1874
}
1875
EXPORT_SYMBOL_NS_GPL(cxl_mem_find_port, "CXL");
1876
1877
static int decoder_populate_targets(struct cxl_switch_decoder *cxlsd,
1878
struct cxl_port *port)
1879
{
1880
struct cxl_decoder *cxld = &cxlsd->cxld;
1881
int i;
1882
1883
device_lock_assert(&port->dev);
1884
1885
if (xa_empty(&port->dports))
1886
return 0;
1887
1888
guard(rwsem_write)(&cxl_rwsem.region);
1889
for (i = 0; i < cxlsd->cxld.interleave_ways; i++) {
1890
struct cxl_dport *dport = find_dport(port, cxld->target_map[i]);
1891
1892
if (!dport) {
1893
/* dport may be activated later */
1894
continue;
1895
}
1896
cxlsd->target[i] = dport;
1897
}
1898
1899
return 0;
1900
}
1901
1902
static struct lock_class_key cxl_decoder_key;
1903
1904
/**
1905
* cxl_decoder_init - Common decoder setup / initialization
1906
* @port: owning port of this decoder
1907
* @cxld: common decoder properties to initialize
1908
*
1909
* A port may contain one or more decoders. Each of those decoders
1910
* enable some address space for CXL.mem utilization. A decoder is
1911
* expected to be configured by the caller before registering via
1912
* cxl_decoder_add()
1913
*/
1914
static int cxl_decoder_init(struct cxl_port *port, struct cxl_decoder *cxld)
1915
{
1916
struct device *dev;
1917
int rc;
1918
1919
rc = ida_alloc(&port->decoder_ida, GFP_KERNEL);
1920
if (rc < 0)
1921
return rc;
1922
1923
/* need parent to stick around to release the id */
1924
get_device(&port->dev);
1925
cxld->id = rc;
1926
1927
dev = &cxld->dev;
1928
device_initialize(dev);
1929
lockdep_set_class(&dev->mutex, &cxl_decoder_key);
1930
device_set_pm_not_required(dev);
1931
dev->parent = &port->dev;
1932
dev->bus = &cxl_bus_type;
1933
1934
/* Pre initialize an "empty" decoder */
1935
cxld->interleave_ways = 1;
1936
cxld->interleave_granularity = PAGE_SIZE;
1937
cxld->target_type = CXL_DECODER_HOSTONLYMEM;
1938
cxld->hpa_range = (struct range) {
1939
.start = 0,
1940
.end = -1,
1941
};
1942
1943
return 0;
1944
}
1945
1946
static int cxl_switch_decoder_init(struct cxl_port *port,
1947
struct cxl_switch_decoder *cxlsd,
1948
int nr_targets)
1949
{
1950
if (nr_targets > CXL_DECODER_MAX_INTERLEAVE)
1951
return -EINVAL;
1952
1953
cxlsd->nr_targets = nr_targets;
1954
return cxl_decoder_init(port, &cxlsd->cxld);
1955
}
1956
1957
/**
1958
* cxl_root_decoder_alloc - Allocate a root level decoder
1959
* @port: owning CXL root of this decoder
1960
* @nr_targets: static number of downstream targets
1961
*
1962
* Return: A new cxl decoder to be registered by cxl_decoder_add(). A
1963
* 'CXL root' decoder is one that decodes from a top-level / static platform
1964
* firmware description of CXL resources into a CXL standard decode
1965
* topology.
1966
*/
1967
struct cxl_root_decoder *cxl_root_decoder_alloc(struct cxl_port *port,
1968
unsigned int nr_targets)
1969
{
1970
struct cxl_root_decoder *cxlrd;
1971
struct cxl_switch_decoder *cxlsd;
1972
struct cxl_decoder *cxld;
1973
int rc;
1974
1975
if (!is_cxl_root(port))
1976
return ERR_PTR(-EINVAL);
1977
1978
cxlrd = kzalloc(struct_size(cxlrd, cxlsd.target, nr_targets),
1979
GFP_KERNEL);
1980
if (!cxlrd)
1981
return ERR_PTR(-ENOMEM);
1982
1983
cxlsd = &cxlrd->cxlsd;
1984
rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
1985
if (rc) {
1986
kfree(cxlrd);
1987
return ERR_PTR(rc);
1988
}
1989
1990
mutex_init(&cxlrd->range_lock);
1991
1992
cxld = &cxlsd->cxld;
1993
cxld->dev.type = &cxl_decoder_root_type;
1994
/*
1995
* cxl_root_decoder_release() special cases negative ids to
1996
* detect memregion_alloc() failures.
1997
*/
1998
atomic_set(&cxlrd->region_id, -1);
1999
rc = memregion_alloc(GFP_KERNEL);
2000
if (rc < 0) {
2001
put_device(&cxld->dev);
2002
return ERR_PTR(rc);
2003
}
2004
2005
atomic_set(&cxlrd->region_id, rc);
2006
cxlrd->qos_class = CXL_QOS_CLASS_INVALID;
2007
return cxlrd;
2008
}
2009
EXPORT_SYMBOL_NS_GPL(cxl_root_decoder_alloc, "CXL");
2010
2011
/**
2012
* cxl_switch_decoder_alloc - Allocate a switch level decoder
2013
* @port: owning CXL switch port of this decoder
2014
* @nr_targets: max number of dynamically addressable downstream targets
2015
*
2016
* Return: A new cxl decoder to be registered by cxl_decoder_add(). A
2017
* 'switch' decoder is any decoder that can be enumerated by PCIe
2018
* topology and the HDM Decoder Capability. This includes the decoders
2019
* that sit between Switch Upstream Ports / Switch Downstream Ports and
2020
* Host Bridges / Root Ports.
2021
*/
2022
struct cxl_switch_decoder *cxl_switch_decoder_alloc(struct cxl_port *port,
2023
unsigned int nr_targets)
2024
{
2025
struct cxl_switch_decoder *cxlsd;
2026
struct cxl_decoder *cxld;
2027
int rc;
2028
2029
if (is_cxl_root(port) || is_cxl_endpoint(port))
2030
return ERR_PTR(-EINVAL);
2031
2032
cxlsd = kzalloc(struct_size(cxlsd, target, nr_targets), GFP_KERNEL);
2033
if (!cxlsd)
2034
return ERR_PTR(-ENOMEM);
2035
2036
rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
2037
if (rc) {
2038
kfree(cxlsd);
2039
return ERR_PTR(rc);
2040
}
2041
2042
cxld = &cxlsd->cxld;
2043
cxld->dev.type = &cxl_decoder_switch_type;
2044
return cxlsd;
2045
}
2046
EXPORT_SYMBOL_NS_GPL(cxl_switch_decoder_alloc, "CXL");
2047
2048
/**
2049
* cxl_endpoint_decoder_alloc - Allocate an endpoint decoder
2050
* @port: owning port of this decoder
2051
*
2052
* Return: A new cxl decoder to be registered by cxl_decoder_add()
2053
*/
2054
struct cxl_endpoint_decoder *cxl_endpoint_decoder_alloc(struct cxl_port *port)
2055
{
2056
struct cxl_endpoint_decoder *cxled;
2057
struct cxl_decoder *cxld;
2058
int rc;
2059
2060
if (!is_cxl_endpoint(port))
2061
return ERR_PTR(-EINVAL);
2062
2063
cxled = kzalloc(sizeof(*cxled), GFP_KERNEL);
2064
if (!cxled)
2065
return ERR_PTR(-ENOMEM);
2066
2067
cxled->pos = -1;
2068
cxled->part = -1;
2069
cxld = &cxled->cxld;
2070
rc = cxl_decoder_init(port, cxld);
2071
if (rc) {
2072
kfree(cxled);
2073
return ERR_PTR(rc);
2074
}
2075
2076
cxld->dev.type = &cxl_decoder_endpoint_type;
2077
return cxled;
2078
}
2079
EXPORT_SYMBOL_NS_GPL(cxl_endpoint_decoder_alloc, "CXL");
2080
2081
/**
2082
* cxl_decoder_add_locked - Add a decoder with targets
2083
* @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
2084
*
2085
* Certain types of decoders may not have any targets. The main example of this
2086
* is an endpoint device. A more awkward example is a hostbridge whose root
2087
* ports get hot added (technically possible, though unlikely).
2088
*
2089
* This is the locked variant of cxl_decoder_add().
2090
*
2091
* Context: Process context. Expects the device lock of the port that owns the
2092
* @cxld to be held.
2093
*
2094
* Return: Negative error code if the decoder wasn't properly configured; else
2095
* returns 0.
2096
*/
2097
int cxl_decoder_add_locked(struct cxl_decoder *cxld)
2098
{
2099
struct cxl_port *port;
2100
struct device *dev;
2101
int rc;
2102
2103
if (WARN_ON_ONCE(!cxld))
2104
return -EINVAL;
2105
2106
if (WARN_ON_ONCE(IS_ERR(cxld)))
2107
return PTR_ERR(cxld);
2108
2109
if (cxld->interleave_ways < 1)
2110
return -EINVAL;
2111
2112
dev = &cxld->dev;
2113
2114
port = to_cxl_port(cxld->dev.parent);
2115
if (!is_endpoint_decoder(dev)) {
2116
struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
2117
2118
rc = decoder_populate_targets(cxlsd, port);
2119
if (rc && (cxld->flags & CXL_DECODER_F_ENABLE)) {
2120
dev_err(&port->dev,
2121
"Failed to populate active decoder targets\n");
2122
return rc;
2123
}
2124
}
2125
2126
rc = dev_set_name(dev, "decoder%d.%d", port->id, cxld->id);
2127
if (rc)
2128
return rc;
2129
2130
return device_add(dev);
2131
}
2132
EXPORT_SYMBOL_NS_GPL(cxl_decoder_add_locked, "CXL");
2133
2134
/**
2135
* cxl_decoder_add - Add a decoder with targets
2136
* @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
2137
*
2138
* This is the unlocked variant of cxl_decoder_add_locked().
2139
* See cxl_decoder_add_locked().
2140
*
2141
* Context: Process context. Takes and releases the device lock of the port that
2142
* owns the @cxld.
2143
*/
2144
int cxl_decoder_add(struct cxl_decoder *cxld)
2145
{
2146
struct cxl_port *port;
2147
2148
if (WARN_ON_ONCE(!cxld))
2149
return -EINVAL;
2150
2151
if (WARN_ON_ONCE(IS_ERR(cxld)))
2152
return PTR_ERR(cxld);
2153
2154
port = to_cxl_port(cxld->dev.parent);
2155
2156
guard(device)(&port->dev);
2157
return cxl_decoder_add_locked(cxld);
2158
}
2159
EXPORT_SYMBOL_NS_GPL(cxl_decoder_add, "CXL");
2160
2161
static void cxld_unregister(void *dev)
2162
{
2163
if (is_endpoint_decoder(dev))
2164
cxl_decoder_detach(NULL, to_cxl_endpoint_decoder(dev), -1,
2165
DETACH_INVALIDATE);
2166
2167
device_unregister(dev);
2168
}
2169
2170
int cxl_decoder_autoremove(struct device *host, struct cxl_decoder *cxld)
2171
{
2172
return devm_add_action_or_reset(host, cxld_unregister, &cxld->dev);
2173
}
2174
EXPORT_SYMBOL_NS_GPL(cxl_decoder_autoremove, "CXL");
2175
2176
/**
2177
* __cxl_driver_register - register a driver for the cxl bus
2178
* @cxl_drv: cxl driver structure to attach
2179
* @owner: owning module/driver
2180
* @modname: KBUILD_MODNAME for parent driver
2181
*/
2182
int __cxl_driver_register(struct cxl_driver *cxl_drv, struct module *owner,
2183
const char *modname)
2184
{
2185
if (!cxl_drv->probe) {
2186
pr_debug("%s ->probe() must be specified\n", modname);
2187
return -EINVAL;
2188
}
2189
2190
if (!cxl_drv->name) {
2191
pr_debug("%s ->name must be specified\n", modname);
2192
return -EINVAL;
2193
}
2194
2195
if (!cxl_drv->id) {
2196
pr_debug("%s ->id must be specified\n", modname);
2197
return -EINVAL;
2198
}
2199
2200
cxl_drv->drv.bus = &cxl_bus_type;
2201
cxl_drv->drv.owner = owner;
2202
cxl_drv->drv.mod_name = modname;
2203
cxl_drv->drv.name = cxl_drv->name;
2204
2205
return driver_register(&cxl_drv->drv);
2206
}
2207
EXPORT_SYMBOL_NS_GPL(__cxl_driver_register, "CXL");
2208
2209
void cxl_driver_unregister(struct cxl_driver *cxl_drv)
2210
{
2211
driver_unregister(&cxl_drv->drv);
2212
}
2213
EXPORT_SYMBOL_NS_GPL(cxl_driver_unregister, "CXL");
2214
2215
static int cxl_bus_uevent(const struct device *dev, struct kobj_uevent_env *env)
2216
{
2217
return add_uevent_var(env, "MODALIAS=" CXL_MODALIAS_FMT,
2218
cxl_device_id(dev));
2219
}
2220
2221
static int cxl_bus_match(struct device *dev, const struct device_driver *drv)
2222
{
2223
return cxl_device_id(dev) == to_cxl_drv(drv)->id;
2224
}
2225
2226
static int cxl_bus_probe(struct device *dev)
2227
{
2228
int rc;
2229
2230
rc = to_cxl_drv(dev->driver)->probe(dev);
2231
dev_dbg(dev, "probe: %d\n", rc);
2232
return rc;
2233
}
2234
2235
static void cxl_bus_remove(struct device *dev)
2236
{
2237
struct cxl_driver *cxl_drv = to_cxl_drv(dev->driver);
2238
2239
if (cxl_drv->remove)
2240
cxl_drv->remove(dev);
2241
}
2242
2243
static struct workqueue_struct *cxl_bus_wq;
2244
2245
static int cxl_rescan_attach(struct device *dev, void *data)
2246
{
2247
int rc = device_attach(dev);
2248
2249
dev_vdbg(dev, "rescan: %s\n", rc ? "attach" : "detached");
2250
2251
return 0;
2252
}
2253
2254
static void cxl_bus_rescan_queue(struct work_struct *w)
2255
{
2256
bus_for_each_dev(&cxl_bus_type, NULL, NULL, cxl_rescan_attach);
2257
}
2258
2259
void cxl_bus_rescan(void)
2260
{
2261
static DECLARE_WORK(rescan_work, cxl_bus_rescan_queue);
2262
2263
queue_work(cxl_bus_wq, &rescan_work);
2264
}
2265
EXPORT_SYMBOL_NS_GPL(cxl_bus_rescan, "CXL");
2266
2267
void cxl_bus_drain(void)
2268
{
2269
drain_workqueue(cxl_bus_wq);
2270
}
2271
EXPORT_SYMBOL_NS_GPL(cxl_bus_drain, "CXL");
2272
2273
bool schedule_cxl_memdev_detach(struct cxl_memdev *cxlmd)
2274
{
2275
return queue_work(cxl_bus_wq, &cxlmd->detach_work);
2276
}
2277
EXPORT_SYMBOL_NS_GPL(schedule_cxl_memdev_detach, "CXL");
2278
2279
static void add_latency(struct access_coordinate *c, long latency)
2280
{
2281
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2282
c[i].write_latency += latency;
2283
c[i].read_latency += latency;
2284
}
2285
}
2286
2287
static bool coordinates_valid(struct access_coordinate *c)
2288
{
2289
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2290
if (c[i].read_bandwidth && c[i].write_bandwidth &&
2291
c[i].read_latency && c[i].write_latency)
2292
continue;
2293
return false;
2294
}
2295
2296
return true;
2297
}
2298
2299
static void set_min_bandwidth(struct access_coordinate *c, unsigned int bw)
2300
{
2301
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2302
c[i].write_bandwidth = min(c[i].write_bandwidth, bw);
2303
c[i].read_bandwidth = min(c[i].read_bandwidth, bw);
2304
}
2305
}
2306
2307
static void set_access_coordinates(struct access_coordinate *out,
2308
struct access_coordinate *in)
2309
{
2310
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++)
2311
out[i] = in[i];
2312
}
2313
2314
static bool parent_port_is_cxl_root(struct cxl_port *port)
2315
{
2316
return is_cxl_root(to_cxl_port(port->dev.parent));
2317
}
2318
2319
/**
2320
* cxl_endpoint_get_perf_coordinates - Retrieve performance numbers stored in dports
2321
* of CXL path
2322
* @port: endpoint cxl_port
2323
* @coord: output performance data
2324
*
2325
* Return: errno on failure, 0 on success.
2326
*/
2327
int cxl_endpoint_get_perf_coordinates(struct cxl_port *port,
2328
struct access_coordinate *coord)
2329
{
2330
struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
2331
struct access_coordinate c[] = {
2332
{
2333
.read_bandwidth = UINT_MAX,
2334
.write_bandwidth = UINT_MAX,
2335
},
2336
{
2337
.read_bandwidth = UINT_MAX,
2338
.write_bandwidth = UINT_MAX,
2339
},
2340
};
2341
struct cxl_port *iter = port;
2342
struct cxl_dport *dport;
2343
struct pci_dev *pdev;
2344
struct device *dev;
2345
unsigned int bw;
2346
bool is_cxl_root;
2347
2348
if (!is_cxl_endpoint(port))
2349
return -EINVAL;
2350
2351
/*
2352
* Skip calculation for RCD. Expectation is HMAT already covers RCD case
2353
* since RCH does not support hotplug.
2354
*/
2355
if (cxlmd->cxlds->rcd)
2356
return 0;
2357
2358
/*
2359
* Exit the loop when the parent port of the current iter port is cxl
2360
* root. The iterative loop starts at the endpoint and gathers the
2361
* latency of the CXL link from the current device/port to the connected
2362
* downstream port each iteration.
2363
*/
2364
do {
2365
dport = iter->parent_dport;
2366
iter = to_cxl_port(iter->dev.parent);
2367
is_cxl_root = parent_port_is_cxl_root(iter);
2368
2369
/*
2370
* There's no valid access_coordinate for a root port since RPs do not
2371
* have CDAT and therefore needs to be skipped.
2372
*/
2373
if (!is_cxl_root) {
2374
if (!coordinates_valid(dport->coord))
2375
return -EINVAL;
2376
cxl_coordinates_combine(c, c, dport->coord);
2377
}
2378
add_latency(c, dport->link_latency);
2379
} while (!is_cxl_root);
2380
2381
dport = iter->parent_dport;
2382
/* Retrieve HB coords */
2383
if (!coordinates_valid(dport->coord))
2384
return -EINVAL;
2385
cxl_coordinates_combine(c, c, dport->coord);
2386
2387
dev = port->uport_dev->parent;
2388
if (!dev_is_pci(dev))
2389
return -ENODEV;
2390
2391
/* Get the calculated PCI paths bandwidth */
2392
pdev = to_pci_dev(dev);
2393
bw = pcie_bandwidth_available(pdev, NULL, NULL, NULL);
2394
if (bw == 0)
2395
return -ENXIO;
2396
bw /= BITS_PER_BYTE;
2397
2398
set_min_bandwidth(c, bw);
2399
set_access_coordinates(coord, c);
2400
2401
return 0;
2402
}
2403
EXPORT_SYMBOL_NS_GPL(cxl_endpoint_get_perf_coordinates, "CXL");
2404
2405
int cxl_port_get_switch_dport_bandwidth(struct cxl_port *port,
2406
struct access_coordinate *c)
2407
{
2408
struct cxl_dport *dport = port->parent_dport;
2409
2410
/* Check this port is connected to a switch DSP and not an RP */
2411
if (parent_port_is_cxl_root(to_cxl_port(port->dev.parent)))
2412
return -ENODEV;
2413
2414
if (!coordinates_valid(dport->coord))
2415
return -EINVAL;
2416
2417
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2418
c[i].read_bandwidth = dport->coord[i].read_bandwidth;
2419
c[i].write_bandwidth = dport->coord[i].write_bandwidth;
2420
}
2421
2422
return 0;
2423
}
2424
2425
/* for user tooling to ensure port disable work has completed */
2426
static ssize_t flush_store(const struct bus_type *bus, const char *buf, size_t count)
2427
{
2428
if (sysfs_streq(buf, "1")) {
2429
flush_workqueue(cxl_bus_wq);
2430
return count;
2431
}
2432
2433
return -EINVAL;
2434
}
2435
2436
static BUS_ATTR_WO(flush);
2437
2438
static struct attribute *cxl_bus_attributes[] = {
2439
&bus_attr_flush.attr,
2440
NULL,
2441
};
2442
2443
static struct attribute_group cxl_bus_attribute_group = {
2444
.attrs = cxl_bus_attributes,
2445
};
2446
2447
static const struct attribute_group *cxl_bus_attribute_groups[] = {
2448
&cxl_bus_attribute_group,
2449
NULL,
2450
};
2451
2452
const struct bus_type cxl_bus_type = {
2453
.name = "cxl",
2454
.uevent = cxl_bus_uevent,
2455
.match = cxl_bus_match,
2456
.probe = cxl_bus_probe,
2457
.remove = cxl_bus_remove,
2458
.bus_groups = cxl_bus_attribute_groups,
2459
};
2460
EXPORT_SYMBOL_NS_GPL(cxl_bus_type, "CXL");
2461
2462
static struct dentry *cxl_debugfs;
2463
2464
struct dentry *cxl_debugfs_create_dir(const char *dir)
2465
{
2466
return debugfs_create_dir(dir, cxl_debugfs);
2467
}
2468
EXPORT_SYMBOL_NS_GPL(cxl_debugfs_create_dir, "CXL");
2469
2470
static __init int cxl_core_init(void)
2471
{
2472
int rc;
2473
2474
cxl_debugfs = debugfs_create_dir("cxl", NULL);
2475
2476
if (einj_cxl_is_initialized())
2477
debugfs_create_file("einj_types", 0400, cxl_debugfs, NULL,
2478
&einj_cxl_available_error_type_fops);
2479
2480
cxl_mbox_init();
2481
2482
rc = cxl_memdev_init();
2483
if (rc)
2484
return rc;
2485
2486
cxl_bus_wq = alloc_ordered_workqueue("cxl_port", 0);
2487
if (!cxl_bus_wq) {
2488
rc = -ENOMEM;
2489
goto err_wq;
2490
}
2491
2492
rc = bus_register(&cxl_bus_type);
2493
if (rc)
2494
goto err_bus;
2495
2496
rc = cxl_region_init();
2497
if (rc)
2498
goto err_region;
2499
2500
rc = cxl_ras_init();
2501
if (rc)
2502
goto err_ras;
2503
2504
return 0;
2505
2506
err_ras:
2507
cxl_region_exit();
2508
err_region:
2509
bus_unregister(&cxl_bus_type);
2510
err_bus:
2511
destroy_workqueue(cxl_bus_wq);
2512
err_wq:
2513
cxl_memdev_exit();
2514
return rc;
2515
}
2516
2517
static void cxl_core_exit(void)
2518
{
2519
cxl_ras_exit();
2520
cxl_region_exit();
2521
bus_unregister(&cxl_bus_type);
2522
destroy_workqueue(cxl_bus_wq);
2523
cxl_memdev_exit();
2524
debugfs_remove_recursive(cxl_debugfs);
2525
}
2526
2527
subsys_initcall(cxl_core_init);
2528
module_exit(cxl_core_exit);
2529
MODULE_DESCRIPTION("CXL: Core Compute Express Link support");
2530
MODULE_LICENSE("GPL v2");
2531
MODULE_IMPORT_NS("CXL");
2532
2533