Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
torvalds
GitHub Repository: torvalds/linux
Path: blob/master/drivers/cxl/core/port.c
26282 views
1
// SPDX-License-Identifier: GPL-2.0-only
2
/* Copyright(c) 2020 Intel Corporation. All rights reserved. */
3
#include <linux/platform_device.h>
4
#include <linux/memregion.h>
5
#include <linux/workqueue.h>
6
#include <linux/debugfs.h>
7
#include <linux/device.h>
8
#include <linux/module.h>
9
#include <linux/pci.h>
10
#include <linux/slab.h>
11
#include <linux/idr.h>
12
#include <linux/node.h>
13
#include <cxl/einj.h>
14
#include <cxlmem.h>
15
#include <cxlpci.h>
16
#include <cxl.h>
17
#include "core.h"
18
19
/**
20
* DOC: cxl core
21
*
22
* The CXL core provides a set of interfaces that can be consumed by CXL aware
23
* drivers. The interfaces allow for creation, modification, and destruction of
24
* regions, memory devices, ports, and decoders. CXL aware drivers must register
25
* with the CXL core via these interfaces in order to be able to participate in
26
* cross-device interleave coordination. The CXL core also establishes and
27
* maintains the bridge to the nvdimm subsystem.
28
*
29
* CXL core introduces sysfs hierarchy to control the devices that are
30
* instantiated by the core.
31
*/
32
33
static DEFINE_IDA(cxl_port_ida);
34
static DEFINE_XARRAY(cxl_root_buses);
35
36
int cxl_num_decoders_committed(struct cxl_port *port)
37
{
38
lockdep_assert_held(&cxl_rwsem.region);
39
40
return port->commit_end + 1;
41
}
42
43
static ssize_t devtype_show(struct device *dev, struct device_attribute *attr,
44
char *buf)
45
{
46
return sysfs_emit(buf, "%s\n", dev->type->name);
47
}
48
static DEVICE_ATTR_RO(devtype);
49
50
static int cxl_device_id(const struct device *dev)
51
{
52
if (dev->type == &cxl_nvdimm_bridge_type)
53
return CXL_DEVICE_NVDIMM_BRIDGE;
54
if (dev->type == &cxl_nvdimm_type)
55
return CXL_DEVICE_NVDIMM;
56
if (dev->type == CXL_PMEM_REGION_TYPE())
57
return CXL_DEVICE_PMEM_REGION;
58
if (dev->type == CXL_DAX_REGION_TYPE())
59
return CXL_DEVICE_DAX_REGION;
60
if (is_cxl_port(dev)) {
61
if (is_cxl_root(to_cxl_port(dev)))
62
return CXL_DEVICE_ROOT;
63
return CXL_DEVICE_PORT;
64
}
65
if (is_cxl_memdev(dev))
66
return CXL_DEVICE_MEMORY_EXPANDER;
67
if (dev->type == CXL_REGION_TYPE())
68
return CXL_DEVICE_REGION;
69
if (dev->type == &cxl_pmu_type)
70
return CXL_DEVICE_PMU;
71
return 0;
72
}
73
74
static ssize_t modalias_show(struct device *dev, struct device_attribute *attr,
75
char *buf)
76
{
77
return sysfs_emit(buf, CXL_MODALIAS_FMT "\n", cxl_device_id(dev));
78
}
79
static DEVICE_ATTR_RO(modalias);
80
81
static struct attribute *cxl_base_attributes[] = {
82
&dev_attr_devtype.attr,
83
&dev_attr_modalias.attr,
84
NULL,
85
};
86
87
struct attribute_group cxl_base_attribute_group = {
88
.attrs = cxl_base_attributes,
89
};
90
91
static ssize_t start_show(struct device *dev, struct device_attribute *attr,
92
char *buf)
93
{
94
struct cxl_decoder *cxld = to_cxl_decoder(dev);
95
96
return sysfs_emit(buf, "%#llx\n", cxld->hpa_range.start);
97
}
98
static DEVICE_ATTR_ADMIN_RO(start);
99
100
static ssize_t size_show(struct device *dev, struct device_attribute *attr,
101
char *buf)
102
{
103
struct cxl_decoder *cxld = to_cxl_decoder(dev);
104
105
return sysfs_emit(buf, "%#llx\n", range_len(&cxld->hpa_range));
106
}
107
static DEVICE_ATTR_RO(size);
108
109
#define CXL_DECODER_FLAG_ATTR(name, flag) \
110
static ssize_t name##_show(struct device *dev, \
111
struct device_attribute *attr, char *buf) \
112
{ \
113
struct cxl_decoder *cxld = to_cxl_decoder(dev); \
114
\
115
return sysfs_emit(buf, "%s\n", \
116
(cxld->flags & (flag)) ? "1" : "0"); \
117
} \
118
static DEVICE_ATTR_RO(name)
119
120
CXL_DECODER_FLAG_ATTR(cap_pmem, CXL_DECODER_F_PMEM);
121
CXL_DECODER_FLAG_ATTR(cap_ram, CXL_DECODER_F_RAM);
122
CXL_DECODER_FLAG_ATTR(cap_type2, CXL_DECODER_F_TYPE2);
123
CXL_DECODER_FLAG_ATTR(cap_type3, CXL_DECODER_F_TYPE3);
124
CXL_DECODER_FLAG_ATTR(locked, CXL_DECODER_F_LOCK);
125
126
static ssize_t target_type_show(struct device *dev,
127
struct device_attribute *attr, char *buf)
128
{
129
struct cxl_decoder *cxld = to_cxl_decoder(dev);
130
131
switch (cxld->target_type) {
132
case CXL_DECODER_DEVMEM:
133
return sysfs_emit(buf, "accelerator\n");
134
case CXL_DECODER_HOSTONLYMEM:
135
return sysfs_emit(buf, "expander\n");
136
}
137
return -ENXIO;
138
}
139
static DEVICE_ATTR_RO(target_type);
140
141
static ssize_t emit_target_list(struct cxl_switch_decoder *cxlsd, char *buf)
142
{
143
struct cxl_decoder *cxld = &cxlsd->cxld;
144
ssize_t offset = 0;
145
int i, rc = 0;
146
147
for (i = 0; i < cxld->interleave_ways; i++) {
148
struct cxl_dport *dport = cxlsd->target[i];
149
struct cxl_dport *next = NULL;
150
151
if (!dport)
152
break;
153
154
if (i + 1 < cxld->interleave_ways)
155
next = cxlsd->target[i + 1];
156
rc = sysfs_emit_at(buf, offset, "%d%s", dport->port_id,
157
next ? "," : "");
158
if (rc < 0)
159
return rc;
160
offset += rc;
161
}
162
163
return offset;
164
}
165
166
static ssize_t target_list_show(struct device *dev,
167
struct device_attribute *attr, char *buf)
168
{
169
struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
170
ssize_t offset;
171
int rc;
172
173
guard(rwsem_read)(&cxl_rwsem.region);
174
rc = emit_target_list(cxlsd, buf);
175
if (rc < 0)
176
return rc;
177
offset = rc;
178
179
rc = sysfs_emit_at(buf, offset, "\n");
180
if (rc < 0)
181
return rc;
182
183
return offset + rc;
184
}
185
static DEVICE_ATTR_RO(target_list);
186
187
static ssize_t mode_show(struct device *dev, struct device_attribute *attr,
188
char *buf)
189
{
190
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
191
struct cxl_memdev *cxlmd = cxled_to_memdev(cxled);
192
struct cxl_dev_state *cxlds = cxlmd->cxlds;
193
/* without @cxl_rwsem.dpa, make sure @part is not reloaded */
194
int part = READ_ONCE(cxled->part);
195
const char *desc;
196
197
if (part < 0)
198
desc = "none";
199
else
200
desc = cxlds->part[part].res.name;
201
202
return sysfs_emit(buf, "%s\n", desc);
203
}
204
205
static ssize_t mode_store(struct device *dev, struct device_attribute *attr,
206
const char *buf, size_t len)
207
{
208
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
209
enum cxl_partition_mode mode;
210
ssize_t rc;
211
212
if (sysfs_streq(buf, "pmem"))
213
mode = CXL_PARTMODE_PMEM;
214
else if (sysfs_streq(buf, "ram"))
215
mode = CXL_PARTMODE_RAM;
216
else
217
return -EINVAL;
218
219
rc = cxl_dpa_set_part(cxled, mode);
220
if (rc)
221
return rc;
222
223
return len;
224
}
225
static DEVICE_ATTR_RW(mode);
226
227
static ssize_t dpa_resource_show(struct device *dev, struct device_attribute *attr,
228
char *buf)
229
{
230
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
231
232
guard(rwsem_read)(&cxl_rwsem.dpa);
233
return sysfs_emit(buf, "%#llx\n", (u64)cxl_dpa_resource_start(cxled));
234
}
235
static DEVICE_ATTR_RO(dpa_resource);
236
237
static ssize_t dpa_size_show(struct device *dev, struct device_attribute *attr,
238
char *buf)
239
{
240
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
241
resource_size_t size = cxl_dpa_size(cxled);
242
243
return sysfs_emit(buf, "%pa\n", &size);
244
}
245
246
static ssize_t dpa_size_store(struct device *dev, struct device_attribute *attr,
247
const char *buf, size_t len)
248
{
249
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
250
unsigned long long size;
251
ssize_t rc;
252
253
rc = kstrtoull(buf, 0, &size);
254
if (rc)
255
return rc;
256
257
if (!IS_ALIGNED(size, SZ_256M))
258
return -EINVAL;
259
260
rc = cxl_dpa_free(cxled);
261
if (rc)
262
return rc;
263
264
if (size == 0)
265
return len;
266
267
rc = cxl_dpa_alloc(cxled, size);
268
if (rc)
269
return rc;
270
271
return len;
272
}
273
static DEVICE_ATTR_RW(dpa_size);
274
275
static ssize_t interleave_granularity_show(struct device *dev,
276
struct device_attribute *attr,
277
char *buf)
278
{
279
struct cxl_decoder *cxld = to_cxl_decoder(dev);
280
281
return sysfs_emit(buf, "%d\n", cxld->interleave_granularity);
282
}
283
284
static DEVICE_ATTR_RO(interleave_granularity);
285
286
static ssize_t interleave_ways_show(struct device *dev,
287
struct device_attribute *attr, char *buf)
288
{
289
struct cxl_decoder *cxld = to_cxl_decoder(dev);
290
291
return sysfs_emit(buf, "%d\n", cxld->interleave_ways);
292
}
293
294
static DEVICE_ATTR_RO(interleave_ways);
295
296
static ssize_t qos_class_show(struct device *dev,
297
struct device_attribute *attr, char *buf)
298
{
299
struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
300
301
return sysfs_emit(buf, "%d\n", cxlrd->qos_class);
302
}
303
static DEVICE_ATTR_RO(qos_class);
304
305
static struct attribute *cxl_decoder_base_attrs[] = {
306
&dev_attr_start.attr,
307
&dev_attr_size.attr,
308
&dev_attr_locked.attr,
309
&dev_attr_interleave_granularity.attr,
310
&dev_attr_interleave_ways.attr,
311
NULL,
312
};
313
314
static struct attribute_group cxl_decoder_base_attribute_group = {
315
.attrs = cxl_decoder_base_attrs,
316
};
317
318
static struct attribute *cxl_decoder_root_attrs[] = {
319
&dev_attr_cap_pmem.attr,
320
&dev_attr_cap_ram.attr,
321
&dev_attr_cap_type2.attr,
322
&dev_attr_cap_type3.attr,
323
&dev_attr_target_list.attr,
324
&dev_attr_qos_class.attr,
325
SET_CXL_REGION_ATTR(create_pmem_region)
326
SET_CXL_REGION_ATTR(create_ram_region)
327
SET_CXL_REGION_ATTR(delete_region)
328
NULL,
329
};
330
331
static bool can_create_pmem(struct cxl_root_decoder *cxlrd)
332
{
333
unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_PMEM;
334
335
return (cxlrd->cxlsd.cxld.flags & flags) == flags;
336
}
337
338
static bool can_create_ram(struct cxl_root_decoder *cxlrd)
339
{
340
unsigned long flags = CXL_DECODER_F_TYPE3 | CXL_DECODER_F_RAM;
341
342
return (cxlrd->cxlsd.cxld.flags & flags) == flags;
343
}
344
345
static umode_t cxl_root_decoder_visible(struct kobject *kobj, struct attribute *a, int n)
346
{
347
struct device *dev = kobj_to_dev(kobj);
348
struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
349
350
if (a == CXL_REGION_ATTR(create_pmem_region) && !can_create_pmem(cxlrd))
351
return 0;
352
353
if (a == CXL_REGION_ATTR(create_ram_region) && !can_create_ram(cxlrd))
354
return 0;
355
356
if (a == CXL_REGION_ATTR(delete_region) &&
357
!(can_create_pmem(cxlrd) || can_create_ram(cxlrd)))
358
return 0;
359
360
return a->mode;
361
}
362
363
static struct attribute_group cxl_decoder_root_attribute_group = {
364
.attrs = cxl_decoder_root_attrs,
365
.is_visible = cxl_root_decoder_visible,
366
};
367
368
static const struct attribute_group *cxl_decoder_root_attribute_groups[] = {
369
&cxl_decoder_root_attribute_group,
370
&cxl_decoder_base_attribute_group,
371
&cxl_base_attribute_group,
372
NULL,
373
};
374
375
static struct attribute *cxl_decoder_switch_attrs[] = {
376
&dev_attr_target_type.attr,
377
&dev_attr_target_list.attr,
378
SET_CXL_REGION_ATTR(region)
379
NULL,
380
};
381
382
static struct attribute_group cxl_decoder_switch_attribute_group = {
383
.attrs = cxl_decoder_switch_attrs,
384
};
385
386
static const struct attribute_group *cxl_decoder_switch_attribute_groups[] = {
387
&cxl_decoder_switch_attribute_group,
388
&cxl_decoder_base_attribute_group,
389
&cxl_base_attribute_group,
390
NULL,
391
};
392
393
static struct attribute *cxl_decoder_endpoint_attrs[] = {
394
&dev_attr_target_type.attr,
395
&dev_attr_mode.attr,
396
&dev_attr_dpa_size.attr,
397
&dev_attr_dpa_resource.attr,
398
SET_CXL_REGION_ATTR(region)
399
NULL,
400
};
401
402
static struct attribute_group cxl_decoder_endpoint_attribute_group = {
403
.attrs = cxl_decoder_endpoint_attrs,
404
};
405
406
static const struct attribute_group *cxl_decoder_endpoint_attribute_groups[] = {
407
&cxl_decoder_base_attribute_group,
408
&cxl_decoder_endpoint_attribute_group,
409
&cxl_base_attribute_group,
410
NULL,
411
};
412
413
static void __cxl_decoder_release(struct cxl_decoder *cxld)
414
{
415
struct cxl_port *port = to_cxl_port(cxld->dev.parent);
416
417
ida_free(&port->decoder_ida, cxld->id);
418
put_device(&port->dev);
419
}
420
421
static void cxl_endpoint_decoder_release(struct device *dev)
422
{
423
struct cxl_endpoint_decoder *cxled = to_cxl_endpoint_decoder(dev);
424
425
__cxl_decoder_release(&cxled->cxld);
426
kfree(cxled);
427
}
428
429
static void cxl_switch_decoder_release(struct device *dev)
430
{
431
struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
432
433
__cxl_decoder_release(&cxlsd->cxld);
434
kfree(cxlsd);
435
}
436
437
struct cxl_root_decoder *to_cxl_root_decoder(struct device *dev)
438
{
439
if (dev_WARN_ONCE(dev, !is_root_decoder(dev),
440
"not a cxl_root_decoder device\n"))
441
return NULL;
442
return container_of(dev, struct cxl_root_decoder, cxlsd.cxld.dev);
443
}
444
EXPORT_SYMBOL_NS_GPL(to_cxl_root_decoder, "CXL");
445
446
static void cxl_root_decoder_release(struct device *dev)
447
{
448
struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(dev);
449
450
if (atomic_read(&cxlrd->region_id) >= 0)
451
memregion_free(atomic_read(&cxlrd->region_id));
452
__cxl_decoder_release(&cxlrd->cxlsd.cxld);
453
kfree(cxlrd);
454
}
455
456
static const struct device_type cxl_decoder_endpoint_type = {
457
.name = "cxl_decoder_endpoint",
458
.release = cxl_endpoint_decoder_release,
459
.groups = cxl_decoder_endpoint_attribute_groups,
460
};
461
462
static const struct device_type cxl_decoder_switch_type = {
463
.name = "cxl_decoder_switch",
464
.release = cxl_switch_decoder_release,
465
.groups = cxl_decoder_switch_attribute_groups,
466
};
467
468
static const struct device_type cxl_decoder_root_type = {
469
.name = "cxl_decoder_root",
470
.release = cxl_root_decoder_release,
471
.groups = cxl_decoder_root_attribute_groups,
472
};
473
474
bool is_endpoint_decoder(struct device *dev)
475
{
476
return dev->type == &cxl_decoder_endpoint_type;
477
}
478
EXPORT_SYMBOL_NS_GPL(is_endpoint_decoder, "CXL");
479
480
bool is_root_decoder(struct device *dev)
481
{
482
return dev->type == &cxl_decoder_root_type;
483
}
484
EXPORT_SYMBOL_NS_GPL(is_root_decoder, "CXL");
485
486
bool is_switch_decoder(struct device *dev)
487
{
488
return is_root_decoder(dev) || dev->type == &cxl_decoder_switch_type;
489
}
490
EXPORT_SYMBOL_NS_GPL(is_switch_decoder, "CXL");
491
492
struct cxl_decoder *to_cxl_decoder(struct device *dev)
493
{
494
if (dev_WARN_ONCE(dev,
495
!is_switch_decoder(dev) && !is_endpoint_decoder(dev),
496
"not a cxl_decoder device\n"))
497
return NULL;
498
return container_of(dev, struct cxl_decoder, dev);
499
}
500
EXPORT_SYMBOL_NS_GPL(to_cxl_decoder, "CXL");
501
502
struct cxl_endpoint_decoder *to_cxl_endpoint_decoder(struct device *dev)
503
{
504
if (dev_WARN_ONCE(dev, !is_endpoint_decoder(dev),
505
"not a cxl_endpoint_decoder device\n"))
506
return NULL;
507
return container_of(dev, struct cxl_endpoint_decoder, cxld.dev);
508
}
509
EXPORT_SYMBOL_NS_GPL(to_cxl_endpoint_decoder, "CXL");
510
511
struct cxl_switch_decoder *to_cxl_switch_decoder(struct device *dev)
512
{
513
if (dev_WARN_ONCE(dev, !is_switch_decoder(dev),
514
"not a cxl_switch_decoder device\n"))
515
return NULL;
516
return container_of(dev, struct cxl_switch_decoder, cxld.dev);
517
}
518
EXPORT_SYMBOL_NS_GPL(to_cxl_switch_decoder, "CXL");
519
520
static void cxl_ep_release(struct cxl_ep *ep)
521
{
522
put_device(ep->ep);
523
kfree(ep);
524
}
525
526
static void cxl_ep_remove(struct cxl_port *port, struct cxl_ep *ep)
527
{
528
if (!ep)
529
return;
530
xa_erase(&port->endpoints, (unsigned long) ep->ep);
531
cxl_ep_release(ep);
532
}
533
534
static void cxl_port_release(struct device *dev)
535
{
536
struct cxl_port *port = to_cxl_port(dev);
537
unsigned long index;
538
struct cxl_ep *ep;
539
540
xa_for_each(&port->endpoints, index, ep)
541
cxl_ep_remove(port, ep);
542
xa_destroy(&port->endpoints);
543
xa_destroy(&port->dports);
544
xa_destroy(&port->regions);
545
ida_free(&cxl_port_ida, port->id);
546
if (is_cxl_root(port))
547
kfree(to_cxl_root(port));
548
else
549
kfree(port);
550
}
551
552
static ssize_t decoders_committed_show(struct device *dev,
553
struct device_attribute *attr, char *buf)
554
{
555
struct cxl_port *port = to_cxl_port(dev);
556
557
guard(rwsem_read)(&cxl_rwsem.region);
558
return sysfs_emit(buf, "%d\n", cxl_num_decoders_committed(port));
559
}
560
561
static DEVICE_ATTR_RO(decoders_committed);
562
563
static struct attribute *cxl_port_attrs[] = {
564
&dev_attr_decoders_committed.attr,
565
NULL,
566
};
567
568
static struct attribute_group cxl_port_attribute_group = {
569
.attrs = cxl_port_attrs,
570
};
571
572
static const struct attribute_group *cxl_port_attribute_groups[] = {
573
&cxl_base_attribute_group,
574
&cxl_port_attribute_group,
575
NULL,
576
};
577
578
static const struct device_type cxl_port_type = {
579
.name = "cxl_port",
580
.release = cxl_port_release,
581
.groups = cxl_port_attribute_groups,
582
};
583
584
bool is_cxl_port(const struct device *dev)
585
{
586
return dev->type == &cxl_port_type;
587
}
588
EXPORT_SYMBOL_NS_GPL(is_cxl_port, "CXL");
589
590
struct cxl_port *to_cxl_port(const struct device *dev)
591
{
592
if (dev_WARN_ONCE(dev, dev->type != &cxl_port_type,
593
"not a cxl_port device\n"))
594
return NULL;
595
return container_of(dev, struct cxl_port, dev);
596
}
597
EXPORT_SYMBOL_NS_GPL(to_cxl_port, "CXL");
598
599
struct cxl_port *parent_port_of(struct cxl_port *port)
600
{
601
if (!port || !port->parent_dport)
602
return NULL;
603
return port->parent_dport->port;
604
}
605
606
static void unregister_port(void *_port)
607
{
608
struct cxl_port *port = _port;
609
struct cxl_port *parent = parent_port_of(port);
610
struct device *lock_dev;
611
612
/*
613
* CXL root port's and the first level of ports are unregistered
614
* under the platform firmware device lock, all other ports are
615
* unregistered while holding their parent port lock.
616
*/
617
if (!parent)
618
lock_dev = port->uport_dev;
619
else if (is_cxl_root(parent))
620
lock_dev = parent->uport_dev;
621
else
622
lock_dev = &parent->dev;
623
624
device_lock_assert(lock_dev);
625
port->dead = true;
626
device_unregister(&port->dev);
627
}
628
629
static void cxl_unlink_uport(void *_port)
630
{
631
struct cxl_port *port = _port;
632
633
sysfs_remove_link(&port->dev.kobj, "uport");
634
}
635
636
static int devm_cxl_link_uport(struct device *host, struct cxl_port *port)
637
{
638
int rc;
639
640
rc = sysfs_create_link(&port->dev.kobj, &port->uport_dev->kobj,
641
"uport");
642
if (rc)
643
return rc;
644
return devm_add_action_or_reset(host, cxl_unlink_uport, port);
645
}
646
647
static void cxl_unlink_parent_dport(void *_port)
648
{
649
struct cxl_port *port = _port;
650
651
sysfs_remove_link(&port->dev.kobj, "parent_dport");
652
}
653
654
static int devm_cxl_link_parent_dport(struct device *host,
655
struct cxl_port *port,
656
struct cxl_dport *parent_dport)
657
{
658
int rc;
659
660
if (!parent_dport)
661
return 0;
662
663
rc = sysfs_create_link(&port->dev.kobj, &parent_dport->dport_dev->kobj,
664
"parent_dport");
665
if (rc)
666
return rc;
667
return devm_add_action_or_reset(host, cxl_unlink_parent_dport, port);
668
}
669
670
static struct lock_class_key cxl_port_key;
671
672
static struct cxl_port *cxl_port_alloc(struct device *uport_dev,
673
struct cxl_dport *parent_dport)
674
{
675
struct cxl_root *cxl_root __free(kfree) = NULL;
676
struct cxl_port *port, *_port __free(kfree) = NULL;
677
struct device *dev;
678
int rc;
679
680
/* No parent_dport, root cxl_port */
681
if (!parent_dport) {
682
cxl_root = kzalloc(sizeof(*cxl_root), GFP_KERNEL);
683
if (!cxl_root)
684
return ERR_PTR(-ENOMEM);
685
} else {
686
_port = kzalloc(sizeof(*port), GFP_KERNEL);
687
if (!_port)
688
return ERR_PTR(-ENOMEM);
689
}
690
691
rc = ida_alloc(&cxl_port_ida, GFP_KERNEL);
692
if (rc < 0)
693
return ERR_PTR(rc);
694
695
if (cxl_root)
696
port = &no_free_ptr(cxl_root)->port;
697
else
698
port = no_free_ptr(_port);
699
700
port->id = rc;
701
port->uport_dev = uport_dev;
702
703
/*
704
* The top-level cxl_port "cxl_root" does not have a cxl_port as
705
* its parent and it does not have any corresponding component
706
* registers as its decode is described by a fixed platform
707
* description.
708
*/
709
dev = &port->dev;
710
if (parent_dport) {
711
struct cxl_port *parent_port = parent_dport->port;
712
struct cxl_port *iter;
713
714
dev->parent = &parent_port->dev;
715
port->depth = parent_port->depth + 1;
716
port->parent_dport = parent_dport;
717
718
/*
719
* walk to the host bridge, or the first ancestor that knows
720
* the host bridge
721
*/
722
iter = port;
723
while (!iter->host_bridge &&
724
!is_cxl_root(to_cxl_port(iter->dev.parent)))
725
iter = to_cxl_port(iter->dev.parent);
726
if (iter->host_bridge)
727
port->host_bridge = iter->host_bridge;
728
else if (parent_dport->rch)
729
port->host_bridge = parent_dport->dport_dev;
730
else
731
port->host_bridge = iter->uport_dev;
732
dev_dbg(uport_dev, "host-bridge: %s\n",
733
dev_name(port->host_bridge));
734
} else
735
dev->parent = uport_dev;
736
737
ida_init(&port->decoder_ida);
738
port->hdm_end = -1;
739
port->commit_end = -1;
740
xa_init(&port->dports);
741
xa_init(&port->endpoints);
742
xa_init(&port->regions);
743
744
device_initialize(dev);
745
lockdep_set_class_and_subclass(&dev->mutex, &cxl_port_key, port->depth);
746
device_set_pm_not_required(dev);
747
dev->bus = &cxl_bus_type;
748
dev->type = &cxl_port_type;
749
750
return port;
751
}
752
753
static int cxl_setup_comp_regs(struct device *host, struct cxl_register_map *map,
754
resource_size_t component_reg_phys)
755
{
756
*map = (struct cxl_register_map) {
757
.host = host,
758
.reg_type = CXL_REGLOC_RBI_EMPTY,
759
.resource = component_reg_phys,
760
};
761
762
if (component_reg_phys == CXL_RESOURCE_NONE)
763
return 0;
764
765
map->reg_type = CXL_REGLOC_RBI_COMPONENT;
766
map->max_size = CXL_COMPONENT_REG_BLOCK_SIZE;
767
768
return cxl_setup_regs(map);
769
}
770
771
static int cxl_port_setup_regs(struct cxl_port *port,
772
resource_size_t component_reg_phys)
773
{
774
if (dev_is_platform(port->uport_dev))
775
return 0;
776
return cxl_setup_comp_regs(&port->dev, &port->reg_map,
777
component_reg_phys);
778
}
779
780
static int cxl_dport_setup_regs(struct device *host, struct cxl_dport *dport,
781
resource_size_t component_reg_phys)
782
{
783
int rc;
784
785
if (dev_is_platform(dport->dport_dev))
786
return 0;
787
788
/*
789
* use @dport->dport_dev for the context for error messages during
790
* register probing, and fixup @host after the fact, since @host may be
791
* NULL.
792
*/
793
rc = cxl_setup_comp_regs(dport->dport_dev, &dport->reg_map,
794
component_reg_phys);
795
dport->reg_map.host = host;
796
return rc;
797
}
798
799
DEFINE_SHOW_ATTRIBUTE(einj_cxl_available_error_type);
800
801
static int cxl_einj_inject(void *data, u64 type)
802
{
803
struct cxl_dport *dport = data;
804
805
if (dport->rch)
806
return einj_cxl_inject_rch_error(dport->rcrb.base, type);
807
808
return einj_cxl_inject_error(to_pci_dev(dport->dport_dev), type);
809
}
810
DEFINE_DEBUGFS_ATTRIBUTE(cxl_einj_inject_fops, NULL, cxl_einj_inject,
811
"0x%llx\n");
812
813
static void cxl_debugfs_create_dport_dir(struct cxl_dport *dport)
814
{
815
struct dentry *dir;
816
817
if (!einj_cxl_is_initialized())
818
return;
819
820
/*
821
* dport_dev needs to be a PCIe port for CXL 2.0+ ports because
822
* EINJ expects a dport SBDF to be specified for 2.0 error injection.
823
*/
824
if (!dport->rch && !dev_is_pci(dport->dport_dev))
825
return;
826
827
dir = cxl_debugfs_create_dir(dev_name(dport->dport_dev));
828
829
debugfs_create_file("einj_inject", 0200, dir, dport,
830
&cxl_einj_inject_fops);
831
}
832
833
static int cxl_port_add(struct cxl_port *port,
834
resource_size_t component_reg_phys,
835
struct cxl_dport *parent_dport)
836
{
837
struct device *dev __free(put_device) = &port->dev;
838
int rc;
839
840
if (is_cxl_memdev(port->uport_dev)) {
841
struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
842
struct cxl_dev_state *cxlds = cxlmd->cxlds;
843
844
rc = dev_set_name(dev, "endpoint%d", port->id);
845
if (rc)
846
return rc;
847
848
/*
849
* The endpoint driver already enumerated the component and RAS
850
* registers. Reuse that enumeration while prepping them to be
851
* mapped by the cxl_port driver.
852
*/
853
port->reg_map = cxlds->reg_map;
854
port->reg_map.host = &port->dev;
855
cxlmd->endpoint = port;
856
} else if (parent_dport) {
857
rc = dev_set_name(dev, "port%d", port->id);
858
if (rc)
859
return rc;
860
861
rc = cxl_port_setup_regs(port, component_reg_phys);
862
if (rc)
863
return rc;
864
} else {
865
rc = dev_set_name(dev, "root%d", port->id);
866
if (rc)
867
return rc;
868
}
869
870
rc = device_add(dev);
871
if (rc)
872
return rc;
873
874
/* Inhibit the cleanup function invoked */
875
dev = NULL;
876
return 0;
877
}
878
879
static struct cxl_port *__devm_cxl_add_port(struct device *host,
880
struct device *uport_dev,
881
resource_size_t component_reg_phys,
882
struct cxl_dport *parent_dport)
883
{
884
struct cxl_port *port;
885
int rc;
886
887
port = cxl_port_alloc(uport_dev, parent_dport);
888
if (IS_ERR(port))
889
return port;
890
891
rc = cxl_port_add(port, component_reg_phys, parent_dport);
892
if (rc)
893
return ERR_PTR(rc);
894
895
rc = devm_add_action_or_reset(host, unregister_port, port);
896
if (rc)
897
return ERR_PTR(rc);
898
899
rc = devm_cxl_link_uport(host, port);
900
if (rc)
901
return ERR_PTR(rc);
902
903
rc = devm_cxl_link_parent_dport(host, port, parent_dport);
904
if (rc)
905
return ERR_PTR(rc);
906
907
if (parent_dport && dev_is_pci(uport_dev))
908
port->pci_latency = cxl_pci_get_latency(to_pci_dev(uport_dev));
909
910
return port;
911
}
912
913
/**
914
* devm_cxl_add_port - register a cxl_port in CXL memory decode hierarchy
915
* @host: host device for devm operations
916
* @uport_dev: "physical" device implementing this upstream port
917
* @component_reg_phys: (optional) for configurable cxl_port instances
918
* @parent_dport: next hop up in the CXL memory decode hierarchy
919
*/
920
struct cxl_port *devm_cxl_add_port(struct device *host,
921
struct device *uport_dev,
922
resource_size_t component_reg_phys,
923
struct cxl_dport *parent_dport)
924
{
925
struct cxl_port *port, *parent_port;
926
927
port = __devm_cxl_add_port(host, uport_dev, component_reg_phys,
928
parent_dport);
929
930
parent_port = parent_dport ? parent_dport->port : NULL;
931
if (IS_ERR(port)) {
932
dev_dbg(uport_dev, "Failed to add%s%s%s: %ld\n",
933
parent_port ? " port to " : "",
934
parent_port ? dev_name(&parent_port->dev) : "",
935
parent_port ? "" : " root port",
936
PTR_ERR(port));
937
} else {
938
dev_dbg(uport_dev, "%s added%s%s%s\n",
939
dev_name(&port->dev),
940
parent_port ? " to " : "",
941
parent_port ? dev_name(&parent_port->dev) : "",
942
parent_port ? "" : " (root port)");
943
}
944
945
return port;
946
}
947
EXPORT_SYMBOL_NS_GPL(devm_cxl_add_port, "CXL");
948
949
struct cxl_root *devm_cxl_add_root(struct device *host,
950
const struct cxl_root_ops *ops)
951
{
952
struct cxl_root *cxl_root;
953
struct cxl_port *port;
954
955
port = devm_cxl_add_port(host, host, CXL_RESOURCE_NONE, NULL);
956
if (IS_ERR(port))
957
return ERR_CAST(port);
958
959
cxl_root = to_cxl_root(port);
960
cxl_root->ops = ops;
961
return cxl_root;
962
}
963
EXPORT_SYMBOL_NS_GPL(devm_cxl_add_root, "CXL");
964
965
struct pci_bus *cxl_port_to_pci_bus(struct cxl_port *port)
966
{
967
/* There is no pci_bus associated with a CXL platform-root port */
968
if (is_cxl_root(port))
969
return NULL;
970
971
if (dev_is_pci(port->uport_dev)) {
972
struct pci_dev *pdev = to_pci_dev(port->uport_dev);
973
974
return pdev->subordinate;
975
}
976
977
return xa_load(&cxl_root_buses, (unsigned long)port->uport_dev);
978
}
979
EXPORT_SYMBOL_NS_GPL(cxl_port_to_pci_bus, "CXL");
980
981
static void unregister_pci_bus(void *uport_dev)
982
{
983
xa_erase(&cxl_root_buses, (unsigned long)uport_dev);
984
}
985
986
int devm_cxl_register_pci_bus(struct device *host, struct device *uport_dev,
987
struct pci_bus *bus)
988
{
989
int rc;
990
991
if (dev_is_pci(uport_dev))
992
return -EINVAL;
993
994
rc = xa_insert(&cxl_root_buses, (unsigned long)uport_dev, bus,
995
GFP_KERNEL);
996
if (rc)
997
return rc;
998
return devm_add_action_or_reset(host, unregister_pci_bus, uport_dev);
999
}
1000
EXPORT_SYMBOL_NS_GPL(devm_cxl_register_pci_bus, "CXL");
1001
1002
static bool dev_is_cxl_root_child(struct device *dev)
1003
{
1004
struct cxl_port *port, *parent;
1005
1006
if (!is_cxl_port(dev))
1007
return false;
1008
1009
port = to_cxl_port(dev);
1010
if (is_cxl_root(port))
1011
return false;
1012
1013
parent = to_cxl_port(port->dev.parent);
1014
if (is_cxl_root(parent))
1015
return true;
1016
1017
return false;
1018
}
1019
1020
struct cxl_root *find_cxl_root(struct cxl_port *port)
1021
{
1022
struct cxl_port *iter = port;
1023
1024
while (iter && !is_cxl_root(iter))
1025
iter = to_cxl_port(iter->dev.parent);
1026
1027
if (!iter)
1028
return NULL;
1029
get_device(&iter->dev);
1030
return to_cxl_root(iter);
1031
}
1032
EXPORT_SYMBOL_NS_GPL(find_cxl_root, "CXL");
1033
1034
static struct cxl_dport *find_dport(struct cxl_port *port, int id)
1035
{
1036
struct cxl_dport *dport;
1037
unsigned long index;
1038
1039
device_lock_assert(&port->dev);
1040
xa_for_each(&port->dports, index, dport)
1041
if (dport->port_id == id)
1042
return dport;
1043
return NULL;
1044
}
1045
1046
static int add_dport(struct cxl_port *port, struct cxl_dport *dport)
1047
{
1048
struct cxl_dport *dup;
1049
int rc;
1050
1051
device_lock_assert(&port->dev);
1052
dup = find_dport(port, dport->port_id);
1053
if (dup) {
1054
dev_err(&port->dev,
1055
"unable to add dport%d-%s non-unique port id (%s)\n",
1056
dport->port_id, dev_name(dport->dport_dev),
1057
dev_name(dup->dport_dev));
1058
return -EBUSY;
1059
}
1060
1061
rc = xa_insert(&port->dports, (unsigned long)dport->dport_dev, dport,
1062
GFP_KERNEL);
1063
if (rc)
1064
return rc;
1065
1066
port->nr_dports++;
1067
return 0;
1068
}
1069
1070
/*
1071
* Since root-level CXL dports cannot be enumerated by PCI they are not
1072
* enumerated by the common port driver that acquires the port lock over
1073
* dport add/remove. Instead, root dports are manually added by a
1074
* platform driver and cond_cxl_root_lock() is used to take the missing
1075
* port lock in that case.
1076
*/
1077
static void cond_cxl_root_lock(struct cxl_port *port)
1078
{
1079
if (is_cxl_root(port))
1080
device_lock(&port->dev);
1081
}
1082
1083
static void cond_cxl_root_unlock(struct cxl_port *port)
1084
{
1085
if (is_cxl_root(port))
1086
device_unlock(&port->dev);
1087
}
1088
1089
static void cxl_dport_remove(void *data)
1090
{
1091
struct cxl_dport *dport = data;
1092
struct cxl_port *port = dport->port;
1093
1094
xa_erase(&port->dports, (unsigned long) dport->dport_dev);
1095
put_device(dport->dport_dev);
1096
}
1097
1098
static void cxl_dport_unlink(void *data)
1099
{
1100
struct cxl_dport *dport = data;
1101
struct cxl_port *port = dport->port;
1102
char link_name[CXL_TARGET_STRLEN];
1103
1104
sprintf(link_name, "dport%d", dport->port_id);
1105
sysfs_remove_link(&port->dev.kobj, link_name);
1106
}
1107
1108
static struct cxl_dport *
1109
__devm_cxl_add_dport(struct cxl_port *port, struct device *dport_dev,
1110
int port_id, resource_size_t component_reg_phys,
1111
resource_size_t rcrb)
1112
{
1113
char link_name[CXL_TARGET_STRLEN];
1114
struct cxl_dport *dport;
1115
struct device *host;
1116
int rc;
1117
1118
if (is_cxl_root(port))
1119
host = port->uport_dev;
1120
else
1121
host = &port->dev;
1122
1123
if (!host->driver) {
1124
dev_WARN_ONCE(&port->dev, 1, "dport:%s bad devm context\n",
1125
dev_name(dport_dev));
1126
return ERR_PTR(-ENXIO);
1127
}
1128
1129
if (snprintf(link_name, CXL_TARGET_STRLEN, "dport%d", port_id) >=
1130
CXL_TARGET_STRLEN)
1131
return ERR_PTR(-EINVAL);
1132
1133
dport = devm_kzalloc(host, sizeof(*dport), GFP_KERNEL);
1134
if (!dport)
1135
return ERR_PTR(-ENOMEM);
1136
1137
dport->dport_dev = dport_dev;
1138
dport->port_id = port_id;
1139
dport->port = port;
1140
1141
if (rcrb == CXL_RESOURCE_NONE) {
1142
rc = cxl_dport_setup_regs(&port->dev, dport,
1143
component_reg_phys);
1144
if (rc)
1145
return ERR_PTR(rc);
1146
} else {
1147
dport->rcrb.base = rcrb;
1148
component_reg_phys = __rcrb_to_component(dport_dev, &dport->rcrb,
1149
CXL_RCRB_DOWNSTREAM);
1150
if (component_reg_phys == CXL_RESOURCE_NONE) {
1151
dev_warn(dport_dev, "Invalid Component Registers in RCRB");
1152
return ERR_PTR(-ENXIO);
1153
}
1154
1155
/*
1156
* RCH @dport is not ready to map until associated with its
1157
* memdev
1158
*/
1159
rc = cxl_dport_setup_regs(NULL, dport, component_reg_phys);
1160
if (rc)
1161
return ERR_PTR(rc);
1162
1163
dport->rch = true;
1164
}
1165
1166
if (component_reg_phys != CXL_RESOURCE_NONE)
1167
dev_dbg(dport_dev, "Component Registers found for dport: %pa\n",
1168
&component_reg_phys);
1169
1170
cond_cxl_root_lock(port);
1171
rc = add_dport(port, dport);
1172
cond_cxl_root_unlock(port);
1173
if (rc)
1174
return ERR_PTR(rc);
1175
1176
get_device(dport_dev);
1177
rc = devm_add_action_or_reset(host, cxl_dport_remove, dport);
1178
if (rc)
1179
return ERR_PTR(rc);
1180
1181
rc = sysfs_create_link(&port->dev.kobj, &dport_dev->kobj, link_name);
1182
if (rc)
1183
return ERR_PTR(rc);
1184
1185
rc = devm_add_action_or_reset(host, cxl_dport_unlink, dport);
1186
if (rc)
1187
return ERR_PTR(rc);
1188
1189
if (dev_is_pci(dport_dev))
1190
dport->link_latency = cxl_pci_get_latency(to_pci_dev(dport_dev));
1191
1192
cxl_debugfs_create_dport_dir(dport);
1193
1194
return dport;
1195
}
1196
1197
/**
1198
* devm_cxl_add_dport - append VH downstream port data to a cxl_port
1199
* @port: the cxl_port that references this dport
1200
* @dport_dev: firmware or PCI device representing the dport
1201
* @port_id: identifier for this dport in a decoder's target list
1202
* @component_reg_phys: optional location of CXL component registers
1203
*
1204
* Note that dports are appended to the devm release action's of the
1205
* either the port's host (for root ports), or the port itself (for
1206
* switch ports)
1207
*/
1208
struct cxl_dport *devm_cxl_add_dport(struct cxl_port *port,
1209
struct device *dport_dev, int port_id,
1210
resource_size_t component_reg_phys)
1211
{
1212
struct cxl_dport *dport;
1213
1214
dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1215
component_reg_phys, CXL_RESOURCE_NONE);
1216
if (IS_ERR(dport)) {
1217
dev_dbg(dport_dev, "failed to add dport to %s: %ld\n",
1218
dev_name(&port->dev), PTR_ERR(dport));
1219
} else {
1220
dev_dbg(dport_dev, "dport added to %s\n",
1221
dev_name(&port->dev));
1222
}
1223
1224
return dport;
1225
}
1226
EXPORT_SYMBOL_NS_GPL(devm_cxl_add_dport, "CXL");
1227
1228
/**
1229
* devm_cxl_add_rch_dport - append RCH downstream port data to a cxl_port
1230
* @port: the cxl_port that references this dport
1231
* @dport_dev: firmware or PCI device representing the dport
1232
* @port_id: identifier for this dport in a decoder's target list
1233
* @rcrb: mandatory location of a Root Complex Register Block
1234
*
1235
* See CXL 3.0 9.11.8 CXL Devices Attached to an RCH
1236
*/
1237
struct cxl_dport *devm_cxl_add_rch_dport(struct cxl_port *port,
1238
struct device *dport_dev, int port_id,
1239
resource_size_t rcrb)
1240
{
1241
struct cxl_dport *dport;
1242
1243
if (rcrb == CXL_RESOURCE_NONE) {
1244
dev_dbg(&port->dev, "failed to add RCH dport, missing RCRB\n");
1245
return ERR_PTR(-EINVAL);
1246
}
1247
1248
dport = __devm_cxl_add_dport(port, dport_dev, port_id,
1249
CXL_RESOURCE_NONE, rcrb);
1250
if (IS_ERR(dport)) {
1251
dev_dbg(dport_dev, "failed to add RCH dport to %s: %ld\n",
1252
dev_name(&port->dev), PTR_ERR(dport));
1253
} else {
1254
dev_dbg(dport_dev, "RCH dport added to %s\n",
1255
dev_name(&port->dev));
1256
}
1257
1258
return dport;
1259
}
1260
EXPORT_SYMBOL_NS_GPL(devm_cxl_add_rch_dport, "CXL");
1261
1262
static int add_ep(struct cxl_ep *new)
1263
{
1264
struct cxl_port *port = new->dport->port;
1265
1266
guard(device)(&port->dev);
1267
if (port->dead)
1268
return -ENXIO;
1269
1270
return xa_insert(&port->endpoints, (unsigned long)new->ep,
1271
new, GFP_KERNEL);
1272
}
1273
1274
/**
1275
* cxl_add_ep - register an endpoint's interest in a port
1276
* @dport: the dport that routes to @ep_dev
1277
* @ep_dev: device representing the endpoint
1278
*
1279
* Intermediate CXL ports are scanned based on the arrival of endpoints.
1280
* When those endpoints depart the port can be destroyed once all
1281
* endpoints that care about that port have been removed.
1282
*/
1283
static int cxl_add_ep(struct cxl_dport *dport, struct device *ep_dev)
1284
{
1285
struct cxl_ep *ep;
1286
int rc;
1287
1288
ep = kzalloc(sizeof(*ep), GFP_KERNEL);
1289
if (!ep)
1290
return -ENOMEM;
1291
1292
ep->ep = get_device(ep_dev);
1293
ep->dport = dport;
1294
1295
rc = add_ep(ep);
1296
if (rc)
1297
cxl_ep_release(ep);
1298
return rc;
1299
}
1300
1301
struct cxl_find_port_ctx {
1302
const struct device *dport_dev;
1303
const struct cxl_port *parent_port;
1304
struct cxl_dport **dport;
1305
};
1306
1307
static int match_port_by_dport(struct device *dev, const void *data)
1308
{
1309
const struct cxl_find_port_ctx *ctx = data;
1310
struct cxl_dport *dport;
1311
struct cxl_port *port;
1312
1313
if (!is_cxl_port(dev))
1314
return 0;
1315
if (ctx->parent_port && dev->parent != &ctx->parent_port->dev)
1316
return 0;
1317
1318
port = to_cxl_port(dev);
1319
dport = cxl_find_dport_by_dev(port, ctx->dport_dev);
1320
if (ctx->dport)
1321
*ctx->dport = dport;
1322
return dport != NULL;
1323
}
1324
1325
static struct cxl_port *__find_cxl_port(struct cxl_find_port_ctx *ctx)
1326
{
1327
struct device *dev;
1328
1329
if (!ctx->dport_dev)
1330
return NULL;
1331
1332
dev = bus_find_device(&cxl_bus_type, NULL, ctx, match_port_by_dport);
1333
if (dev)
1334
return to_cxl_port(dev);
1335
return NULL;
1336
}
1337
1338
static struct cxl_port *find_cxl_port(struct device *dport_dev,
1339
struct cxl_dport **dport)
1340
{
1341
struct cxl_find_port_ctx ctx = {
1342
.dport_dev = dport_dev,
1343
.dport = dport,
1344
};
1345
struct cxl_port *port;
1346
1347
port = __find_cxl_port(&ctx);
1348
return port;
1349
}
1350
1351
static struct cxl_port *find_cxl_port_at(struct cxl_port *parent_port,
1352
struct device *dport_dev,
1353
struct cxl_dport **dport)
1354
{
1355
struct cxl_find_port_ctx ctx = {
1356
.dport_dev = dport_dev,
1357
.parent_port = parent_port,
1358
.dport = dport,
1359
};
1360
struct cxl_port *port;
1361
1362
port = __find_cxl_port(&ctx);
1363
return port;
1364
}
1365
1366
/*
1367
* All users of grandparent() are using it to walk PCIe-like switch port
1368
* hierarchy. A PCIe switch is comprised of a bridge device representing the
1369
* upstream switch port and N bridges representing downstream switch ports. When
1370
* bridges stack the grand-parent of a downstream switch port is another
1371
* downstream switch port in the immediate ancestor switch.
1372
*/
1373
static struct device *grandparent(struct device *dev)
1374
{
1375
if (dev && dev->parent)
1376
return dev->parent->parent;
1377
return NULL;
1378
}
1379
1380
static struct device *endpoint_host(struct cxl_port *endpoint)
1381
{
1382
struct cxl_port *port = to_cxl_port(endpoint->dev.parent);
1383
1384
if (is_cxl_root(port))
1385
return port->uport_dev;
1386
return &port->dev;
1387
}
1388
1389
static void delete_endpoint(void *data)
1390
{
1391
struct cxl_memdev *cxlmd = data;
1392
struct cxl_port *endpoint = cxlmd->endpoint;
1393
struct device *host = endpoint_host(endpoint);
1394
1395
scoped_guard(device, host) {
1396
if (host->driver && !endpoint->dead) {
1397
devm_release_action(host, cxl_unlink_parent_dport, endpoint);
1398
devm_release_action(host, cxl_unlink_uport, endpoint);
1399
devm_release_action(host, unregister_port, endpoint);
1400
}
1401
cxlmd->endpoint = NULL;
1402
}
1403
put_device(&endpoint->dev);
1404
put_device(host);
1405
}
1406
1407
int cxl_endpoint_autoremove(struct cxl_memdev *cxlmd, struct cxl_port *endpoint)
1408
{
1409
struct device *host = endpoint_host(endpoint);
1410
struct device *dev = &cxlmd->dev;
1411
1412
get_device(host);
1413
get_device(&endpoint->dev);
1414
cxlmd->depth = endpoint->depth;
1415
return devm_add_action_or_reset(dev, delete_endpoint, cxlmd);
1416
}
1417
EXPORT_SYMBOL_NS_GPL(cxl_endpoint_autoremove, "CXL");
1418
1419
/*
1420
* The natural end of life of a non-root 'cxl_port' is when its parent port goes
1421
* through a ->remove() event ("top-down" unregistration). The unnatural trigger
1422
* for a port to be unregistered is when all memdevs beneath that port have gone
1423
* through ->remove(). This "bottom-up" removal selectively removes individual
1424
* child ports manually. This depends on devm_cxl_add_port() to not change is
1425
* devm action registration order, and for dports to have already been
1426
* destroyed by reap_dports().
1427
*/
1428
static void delete_switch_port(struct cxl_port *port)
1429
{
1430
devm_release_action(port->dev.parent, cxl_unlink_parent_dport, port);
1431
devm_release_action(port->dev.parent, cxl_unlink_uport, port);
1432
devm_release_action(port->dev.parent, unregister_port, port);
1433
}
1434
1435
static void reap_dports(struct cxl_port *port)
1436
{
1437
struct cxl_dport *dport;
1438
unsigned long index;
1439
1440
device_lock_assert(&port->dev);
1441
1442
xa_for_each(&port->dports, index, dport) {
1443
devm_release_action(&port->dev, cxl_dport_unlink, dport);
1444
devm_release_action(&port->dev, cxl_dport_remove, dport);
1445
devm_kfree(&port->dev, dport);
1446
}
1447
}
1448
1449
struct detach_ctx {
1450
struct cxl_memdev *cxlmd;
1451
int depth;
1452
};
1453
1454
static int port_has_memdev(struct device *dev, const void *data)
1455
{
1456
const struct detach_ctx *ctx = data;
1457
struct cxl_port *port;
1458
1459
if (!is_cxl_port(dev))
1460
return 0;
1461
1462
port = to_cxl_port(dev);
1463
if (port->depth != ctx->depth)
1464
return 0;
1465
1466
return !!cxl_ep_load(port, ctx->cxlmd);
1467
}
1468
1469
static void cxl_detach_ep(void *data)
1470
{
1471
struct cxl_memdev *cxlmd = data;
1472
1473
for (int i = cxlmd->depth - 1; i >= 1; i--) {
1474
struct cxl_port *port, *parent_port;
1475
struct detach_ctx ctx = {
1476
.cxlmd = cxlmd,
1477
.depth = i,
1478
};
1479
struct cxl_ep *ep;
1480
bool died = false;
1481
1482
struct device *dev __free(put_device) =
1483
bus_find_device(&cxl_bus_type, NULL, &ctx, port_has_memdev);
1484
if (!dev)
1485
continue;
1486
port = to_cxl_port(dev);
1487
1488
parent_port = to_cxl_port(port->dev.parent);
1489
device_lock(&parent_port->dev);
1490
device_lock(&port->dev);
1491
ep = cxl_ep_load(port, cxlmd);
1492
dev_dbg(&cxlmd->dev, "disconnect %s from %s\n",
1493
ep ? dev_name(ep->ep) : "", dev_name(&port->dev));
1494
cxl_ep_remove(port, ep);
1495
if (ep && !port->dead && xa_empty(&port->endpoints) &&
1496
!is_cxl_root(parent_port) && parent_port->dev.driver) {
1497
/*
1498
* This was the last ep attached to a dynamically
1499
* enumerated port. Block new cxl_add_ep() and garbage
1500
* collect the port.
1501
*/
1502
died = true;
1503
port->dead = true;
1504
reap_dports(port);
1505
}
1506
device_unlock(&port->dev);
1507
1508
if (died) {
1509
dev_dbg(&cxlmd->dev, "delete %s\n",
1510
dev_name(&port->dev));
1511
delete_switch_port(port);
1512
}
1513
device_unlock(&parent_port->dev);
1514
}
1515
}
1516
1517
static resource_size_t find_component_registers(struct device *dev)
1518
{
1519
struct cxl_register_map map;
1520
struct pci_dev *pdev;
1521
1522
/*
1523
* Theoretically, CXL component registers can be hosted on a
1524
* non-PCI device, in practice, only cxl_test hits this case.
1525
*/
1526
if (!dev_is_pci(dev))
1527
return CXL_RESOURCE_NONE;
1528
1529
pdev = to_pci_dev(dev);
1530
1531
cxl_find_regblock(pdev, CXL_REGLOC_RBI_COMPONENT, &map);
1532
return map.resource;
1533
}
1534
1535
static int add_port_attach_ep(struct cxl_memdev *cxlmd,
1536
struct device *uport_dev,
1537
struct device *dport_dev)
1538
{
1539
struct device *dparent = grandparent(dport_dev);
1540
struct cxl_dport *dport, *parent_dport;
1541
resource_size_t component_reg_phys;
1542
int rc;
1543
1544
if (!dparent) {
1545
/*
1546
* The iteration reached the topology root without finding the
1547
* CXL-root 'cxl_port' on a previous iteration, fail for now to
1548
* be re-probed after platform driver attaches.
1549
*/
1550
dev_dbg(&cxlmd->dev, "%s is a root dport\n",
1551
dev_name(dport_dev));
1552
return -ENXIO;
1553
}
1554
1555
struct cxl_port *parent_port __free(put_cxl_port) =
1556
find_cxl_port(dparent, &parent_dport);
1557
if (!parent_port) {
1558
/* iterate to create this parent_port */
1559
return -EAGAIN;
1560
}
1561
1562
/*
1563
* Definition with __free() here to keep the sequence of
1564
* dereferencing the device of the port before the parent_port releasing.
1565
*/
1566
struct cxl_port *port __free(put_cxl_port) = NULL;
1567
scoped_guard(device, &parent_port->dev) {
1568
if (!parent_port->dev.driver) {
1569
dev_warn(&cxlmd->dev,
1570
"port %s:%s disabled, failed to enumerate CXL.mem\n",
1571
dev_name(&parent_port->dev), dev_name(uport_dev));
1572
return -ENXIO;
1573
}
1574
1575
port = find_cxl_port_at(parent_port, dport_dev, &dport);
1576
if (!port) {
1577
component_reg_phys = find_component_registers(uport_dev);
1578
port = devm_cxl_add_port(&parent_port->dev, uport_dev,
1579
component_reg_phys, parent_dport);
1580
if (IS_ERR(port))
1581
return PTR_ERR(port);
1582
1583
/* retry find to pick up the new dport information */
1584
port = find_cxl_port_at(parent_port, dport_dev, &dport);
1585
if (!port)
1586
return -ENXIO;
1587
}
1588
}
1589
1590
dev_dbg(&cxlmd->dev, "add to new port %s:%s\n",
1591
dev_name(&port->dev), dev_name(port->uport_dev));
1592
rc = cxl_add_ep(dport, &cxlmd->dev);
1593
if (rc == -EBUSY) {
1594
/*
1595
* "can't" happen, but this error code means
1596
* something to the caller, so translate it.
1597
*/
1598
rc = -ENXIO;
1599
}
1600
1601
return rc;
1602
}
1603
1604
int devm_cxl_enumerate_ports(struct cxl_memdev *cxlmd)
1605
{
1606
struct device *dev = &cxlmd->dev;
1607
struct device *iter;
1608
int rc;
1609
1610
/*
1611
* Skip intermediate port enumeration in the RCH case, there
1612
* are no ports in between a host bridge and an endpoint.
1613
*/
1614
if (cxlmd->cxlds->rcd)
1615
return 0;
1616
1617
rc = devm_add_action_or_reset(&cxlmd->dev, cxl_detach_ep, cxlmd);
1618
if (rc)
1619
return rc;
1620
1621
/*
1622
* Scan for and add all cxl_ports in this device's ancestry.
1623
* Repeat until no more ports are added. Abort if a port add
1624
* attempt fails.
1625
*/
1626
retry:
1627
for (iter = dev; iter; iter = grandparent(iter)) {
1628
struct device *dport_dev = grandparent(iter);
1629
struct device *uport_dev;
1630
struct cxl_dport *dport;
1631
1632
/*
1633
* The terminal "grandparent" in PCI is NULL and @platform_bus
1634
* for platform devices
1635
*/
1636
if (!dport_dev || dport_dev == &platform_bus)
1637
return 0;
1638
1639
uport_dev = dport_dev->parent;
1640
if (!uport_dev) {
1641
dev_warn(dev, "at %s no parent for dport: %s\n",
1642
dev_name(iter), dev_name(dport_dev));
1643
return -ENXIO;
1644
}
1645
1646
dev_dbg(dev, "scan: iter: %s dport_dev: %s parent: %s\n",
1647
dev_name(iter), dev_name(dport_dev),
1648
dev_name(uport_dev));
1649
struct cxl_port *port __free(put_cxl_port) =
1650
find_cxl_port(dport_dev, &dport);
1651
if (port) {
1652
dev_dbg(&cxlmd->dev,
1653
"found already registered port %s:%s\n",
1654
dev_name(&port->dev),
1655
dev_name(port->uport_dev));
1656
rc = cxl_add_ep(dport, &cxlmd->dev);
1657
1658
/*
1659
* If the endpoint already exists in the port's list,
1660
* that's ok, it was added on a previous pass.
1661
* Otherwise, retry in add_port_attach_ep() after taking
1662
* the parent_port lock as the current port may be being
1663
* reaped.
1664
*/
1665
if (rc && rc != -EBUSY)
1666
return rc;
1667
1668
cxl_gpf_port_setup(dport);
1669
1670
/* Any more ports to add between this one and the root? */
1671
if (!dev_is_cxl_root_child(&port->dev))
1672
continue;
1673
1674
return 0;
1675
}
1676
1677
rc = add_port_attach_ep(cxlmd, uport_dev, dport_dev);
1678
/* port missing, try to add parent */
1679
if (rc == -EAGAIN)
1680
continue;
1681
/* failed to add ep or port */
1682
if (rc)
1683
return rc;
1684
/* port added, new descendants possible, start over */
1685
goto retry;
1686
}
1687
1688
return 0;
1689
}
1690
EXPORT_SYMBOL_NS_GPL(devm_cxl_enumerate_ports, "CXL");
1691
1692
struct cxl_port *cxl_pci_find_port(struct pci_dev *pdev,
1693
struct cxl_dport **dport)
1694
{
1695
return find_cxl_port(pdev->dev.parent, dport);
1696
}
1697
EXPORT_SYMBOL_NS_GPL(cxl_pci_find_port, "CXL");
1698
1699
struct cxl_port *cxl_mem_find_port(struct cxl_memdev *cxlmd,
1700
struct cxl_dport **dport)
1701
{
1702
return find_cxl_port(grandparent(&cxlmd->dev), dport);
1703
}
1704
EXPORT_SYMBOL_NS_GPL(cxl_mem_find_port, "CXL");
1705
1706
static int decoder_populate_targets(struct cxl_switch_decoder *cxlsd,
1707
struct cxl_port *port, int *target_map)
1708
{
1709
int i;
1710
1711
if (!target_map)
1712
return 0;
1713
1714
device_lock_assert(&port->dev);
1715
1716
if (xa_empty(&port->dports))
1717
return -EINVAL;
1718
1719
guard(rwsem_write)(&cxl_rwsem.region);
1720
for (i = 0; i < cxlsd->cxld.interleave_ways; i++) {
1721
struct cxl_dport *dport = find_dport(port, target_map[i]);
1722
1723
if (!dport)
1724
return -ENXIO;
1725
cxlsd->target[i] = dport;
1726
}
1727
1728
return 0;
1729
}
1730
1731
static struct lock_class_key cxl_decoder_key;
1732
1733
/**
1734
* cxl_decoder_init - Common decoder setup / initialization
1735
* @port: owning port of this decoder
1736
* @cxld: common decoder properties to initialize
1737
*
1738
* A port may contain one or more decoders. Each of those decoders
1739
* enable some address space for CXL.mem utilization. A decoder is
1740
* expected to be configured by the caller before registering via
1741
* cxl_decoder_add()
1742
*/
1743
static int cxl_decoder_init(struct cxl_port *port, struct cxl_decoder *cxld)
1744
{
1745
struct device *dev;
1746
int rc;
1747
1748
rc = ida_alloc(&port->decoder_ida, GFP_KERNEL);
1749
if (rc < 0)
1750
return rc;
1751
1752
/* need parent to stick around to release the id */
1753
get_device(&port->dev);
1754
cxld->id = rc;
1755
1756
dev = &cxld->dev;
1757
device_initialize(dev);
1758
lockdep_set_class(&dev->mutex, &cxl_decoder_key);
1759
device_set_pm_not_required(dev);
1760
dev->parent = &port->dev;
1761
dev->bus = &cxl_bus_type;
1762
1763
/* Pre initialize an "empty" decoder */
1764
cxld->interleave_ways = 1;
1765
cxld->interleave_granularity = PAGE_SIZE;
1766
cxld->target_type = CXL_DECODER_HOSTONLYMEM;
1767
cxld->hpa_range = (struct range) {
1768
.start = 0,
1769
.end = -1,
1770
};
1771
1772
return 0;
1773
}
1774
1775
static int cxl_switch_decoder_init(struct cxl_port *port,
1776
struct cxl_switch_decoder *cxlsd,
1777
int nr_targets)
1778
{
1779
if (nr_targets > CXL_DECODER_MAX_INTERLEAVE)
1780
return -EINVAL;
1781
1782
cxlsd->nr_targets = nr_targets;
1783
return cxl_decoder_init(port, &cxlsd->cxld);
1784
}
1785
1786
/**
1787
* cxl_root_decoder_alloc - Allocate a root level decoder
1788
* @port: owning CXL root of this decoder
1789
* @nr_targets: static number of downstream targets
1790
*
1791
* Return: A new cxl decoder to be registered by cxl_decoder_add(). A
1792
* 'CXL root' decoder is one that decodes from a top-level / static platform
1793
* firmware description of CXL resources into a CXL standard decode
1794
* topology.
1795
*/
1796
struct cxl_root_decoder *cxl_root_decoder_alloc(struct cxl_port *port,
1797
unsigned int nr_targets)
1798
{
1799
struct cxl_root_decoder *cxlrd;
1800
struct cxl_switch_decoder *cxlsd;
1801
struct cxl_decoder *cxld;
1802
int rc;
1803
1804
if (!is_cxl_root(port))
1805
return ERR_PTR(-EINVAL);
1806
1807
cxlrd = kzalloc(struct_size(cxlrd, cxlsd.target, nr_targets),
1808
GFP_KERNEL);
1809
if (!cxlrd)
1810
return ERR_PTR(-ENOMEM);
1811
1812
cxlsd = &cxlrd->cxlsd;
1813
rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
1814
if (rc) {
1815
kfree(cxlrd);
1816
return ERR_PTR(rc);
1817
}
1818
1819
mutex_init(&cxlrd->range_lock);
1820
1821
cxld = &cxlsd->cxld;
1822
cxld->dev.type = &cxl_decoder_root_type;
1823
/*
1824
* cxl_root_decoder_release() special cases negative ids to
1825
* detect memregion_alloc() failures.
1826
*/
1827
atomic_set(&cxlrd->region_id, -1);
1828
rc = memregion_alloc(GFP_KERNEL);
1829
if (rc < 0) {
1830
put_device(&cxld->dev);
1831
return ERR_PTR(rc);
1832
}
1833
1834
atomic_set(&cxlrd->region_id, rc);
1835
cxlrd->qos_class = CXL_QOS_CLASS_INVALID;
1836
return cxlrd;
1837
}
1838
EXPORT_SYMBOL_NS_GPL(cxl_root_decoder_alloc, "CXL");
1839
1840
/**
1841
* cxl_switch_decoder_alloc - Allocate a switch level decoder
1842
* @port: owning CXL switch port of this decoder
1843
* @nr_targets: max number of dynamically addressable downstream targets
1844
*
1845
* Return: A new cxl decoder to be registered by cxl_decoder_add(). A
1846
* 'switch' decoder is any decoder that can be enumerated by PCIe
1847
* topology and the HDM Decoder Capability. This includes the decoders
1848
* that sit between Switch Upstream Ports / Switch Downstream Ports and
1849
* Host Bridges / Root Ports.
1850
*/
1851
struct cxl_switch_decoder *cxl_switch_decoder_alloc(struct cxl_port *port,
1852
unsigned int nr_targets)
1853
{
1854
struct cxl_switch_decoder *cxlsd;
1855
struct cxl_decoder *cxld;
1856
int rc;
1857
1858
if (is_cxl_root(port) || is_cxl_endpoint(port))
1859
return ERR_PTR(-EINVAL);
1860
1861
cxlsd = kzalloc(struct_size(cxlsd, target, nr_targets), GFP_KERNEL);
1862
if (!cxlsd)
1863
return ERR_PTR(-ENOMEM);
1864
1865
rc = cxl_switch_decoder_init(port, cxlsd, nr_targets);
1866
if (rc) {
1867
kfree(cxlsd);
1868
return ERR_PTR(rc);
1869
}
1870
1871
cxld = &cxlsd->cxld;
1872
cxld->dev.type = &cxl_decoder_switch_type;
1873
return cxlsd;
1874
}
1875
EXPORT_SYMBOL_NS_GPL(cxl_switch_decoder_alloc, "CXL");
1876
1877
/**
1878
* cxl_endpoint_decoder_alloc - Allocate an endpoint decoder
1879
* @port: owning port of this decoder
1880
*
1881
* Return: A new cxl decoder to be registered by cxl_decoder_add()
1882
*/
1883
struct cxl_endpoint_decoder *cxl_endpoint_decoder_alloc(struct cxl_port *port)
1884
{
1885
struct cxl_endpoint_decoder *cxled;
1886
struct cxl_decoder *cxld;
1887
int rc;
1888
1889
if (!is_cxl_endpoint(port))
1890
return ERR_PTR(-EINVAL);
1891
1892
cxled = kzalloc(sizeof(*cxled), GFP_KERNEL);
1893
if (!cxled)
1894
return ERR_PTR(-ENOMEM);
1895
1896
cxled->pos = -1;
1897
cxled->part = -1;
1898
cxld = &cxled->cxld;
1899
rc = cxl_decoder_init(port, cxld);
1900
if (rc) {
1901
kfree(cxled);
1902
return ERR_PTR(rc);
1903
}
1904
1905
cxld->dev.type = &cxl_decoder_endpoint_type;
1906
return cxled;
1907
}
1908
EXPORT_SYMBOL_NS_GPL(cxl_endpoint_decoder_alloc, "CXL");
1909
1910
/**
1911
* cxl_decoder_add_locked - Add a decoder with targets
1912
* @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
1913
* @target_map: A list of downstream ports that this decoder can direct memory
1914
* traffic to. These numbers should correspond with the port number
1915
* in the PCIe Link Capabilities structure.
1916
*
1917
* Certain types of decoders may not have any targets. The main example of this
1918
* is an endpoint device. A more awkward example is a hostbridge whose root
1919
* ports get hot added (technically possible, though unlikely).
1920
*
1921
* This is the locked variant of cxl_decoder_add().
1922
*
1923
* Context: Process context. Expects the device lock of the port that owns the
1924
* @cxld to be held.
1925
*
1926
* Return: Negative error code if the decoder wasn't properly configured; else
1927
* returns 0.
1928
*/
1929
int cxl_decoder_add_locked(struct cxl_decoder *cxld, int *target_map)
1930
{
1931
struct cxl_port *port;
1932
struct device *dev;
1933
int rc;
1934
1935
if (WARN_ON_ONCE(!cxld))
1936
return -EINVAL;
1937
1938
if (WARN_ON_ONCE(IS_ERR(cxld)))
1939
return PTR_ERR(cxld);
1940
1941
if (cxld->interleave_ways < 1)
1942
return -EINVAL;
1943
1944
dev = &cxld->dev;
1945
1946
port = to_cxl_port(cxld->dev.parent);
1947
if (!is_endpoint_decoder(dev)) {
1948
struct cxl_switch_decoder *cxlsd = to_cxl_switch_decoder(dev);
1949
1950
rc = decoder_populate_targets(cxlsd, port, target_map);
1951
if (rc && (cxld->flags & CXL_DECODER_F_ENABLE)) {
1952
dev_err(&port->dev,
1953
"Failed to populate active decoder targets\n");
1954
return rc;
1955
}
1956
}
1957
1958
rc = dev_set_name(dev, "decoder%d.%d", port->id, cxld->id);
1959
if (rc)
1960
return rc;
1961
1962
return device_add(dev);
1963
}
1964
EXPORT_SYMBOL_NS_GPL(cxl_decoder_add_locked, "CXL");
1965
1966
/**
1967
* cxl_decoder_add - Add a decoder with targets
1968
* @cxld: The cxl decoder allocated by cxl_<type>_decoder_alloc()
1969
* @target_map: A list of downstream ports that this decoder can direct memory
1970
* traffic to. These numbers should correspond with the port number
1971
* in the PCIe Link Capabilities structure.
1972
*
1973
* This is the unlocked variant of cxl_decoder_add_locked().
1974
* See cxl_decoder_add_locked().
1975
*
1976
* Context: Process context. Takes and releases the device lock of the port that
1977
* owns the @cxld.
1978
*/
1979
int cxl_decoder_add(struct cxl_decoder *cxld, int *target_map)
1980
{
1981
struct cxl_port *port;
1982
1983
if (WARN_ON_ONCE(!cxld))
1984
return -EINVAL;
1985
1986
if (WARN_ON_ONCE(IS_ERR(cxld)))
1987
return PTR_ERR(cxld);
1988
1989
port = to_cxl_port(cxld->dev.parent);
1990
1991
guard(device)(&port->dev);
1992
return cxl_decoder_add_locked(cxld, target_map);
1993
}
1994
EXPORT_SYMBOL_NS_GPL(cxl_decoder_add, "CXL");
1995
1996
static void cxld_unregister(void *dev)
1997
{
1998
if (is_endpoint_decoder(dev))
1999
cxl_decoder_detach(NULL, to_cxl_endpoint_decoder(dev), -1,
2000
DETACH_INVALIDATE);
2001
2002
device_unregister(dev);
2003
}
2004
2005
int cxl_decoder_autoremove(struct device *host, struct cxl_decoder *cxld)
2006
{
2007
return devm_add_action_or_reset(host, cxld_unregister, &cxld->dev);
2008
}
2009
EXPORT_SYMBOL_NS_GPL(cxl_decoder_autoremove, "CXL");
2010
2011
/**
2012
* __cxl_driver_register - register a driver for the cxl bus
2013
* @cxl_drv: cxl driver structure to attach
2014
* @owner: owning module/driver
2015
* @modname: KBUILD_MODNAME for parent driver
2016
*/
2017
int __cxl_driver_register(struct cxl_driver *cxl_drv, struct module *owner,
2018
const char *modname)
2019
{
2020
if (!cxl_drv->probe) {
2021
pr_debug("%s ->probe() must be specified\n", modname);
2022
return -EINVAL;
2023
}
2024
2025
if (!cxl_drv->name) {
2026
pr_debug("%s ->name must be specified\n", modname);
2027
return -EINVAL;
2028
}
2029
2030
if (!cxl_drv->id) {
2031
pr_debug("%s ->id must be specified\n", modname);
2032
return -EINVAL;
2033
}
2034
2035
cxl_drv->drv.bus = &cxl_bus_type;
2036
cxl_drv->drv.owner = owner;
2037
cxl_drv->drv.mod_name = modname;
2038
cxl_drv->drv.name = cxl_drv->name;
2039
2040
return driver_register(&cxl_drv->drv);
2041
}
2042
EXPORT_SYMBOL_NS_GPL(__cxl_driver_register, "CXL");
2043
2044
void cxl_driver_unregister(struct cxl_driver *cxl_drv)
2045
{
2046
driver_unregister(&cxl_drv->drv);
2047
}
2048
EXPORT_SYMBOL_NS_GPL(cxl_driver_unregister, "CXL");
2049
2050
static int cxl_bus_uevent(const struct device *dev, struct kobj_uevent_env *env)
2051
{
2052
return add_uevent_var(env, "MODALIAS=" CXL_MODALIAS_FMT,
2053
cxl_device_id(dev));
2054
}
2055
2056
static int cxl_bus_match(struct device *dev, const struct device_driver *drv)
2057
{
2058
return cxl_device_id(dev) == to_cxl_drv(drv)->id;
2059
}
2060
2061
static int cxl_bus_probe(struct device *dev)
2062
{
2063
int rc;
2064
2065
rc = to_cxl_drv(dev->driver)->probe(dev);
2066
dev_dbg(dev, "probe: %d\n", rc);
2067
return rc;
2068
}
2069
2070
static void cxl_bus_remove(struct device *dev)
2071
{
2072
struct cxl_driver *cxl_drv = to_cxl_drv(dev->driver);
2073
2074
if (cxl_drv->remove)
2075
cxl_drv->remove(dev);
2076
}
2077
2078
static struct workqueue_struct *cxl_bus_wq;
2079
2080
static int cxl_rescan_attach(struct device *dev, void *data)
2081
{
2082
int rc = device_attach(dev);
2083
2084
dev_vdbg(dev, "rescan: %s\n", rc ? "attach" : "detached");
2085
2086
return 0;
2087
}
2088
2089
static void cxl_bus_rescan_queue(struct work_struct *w)
2090
{
2091
bus_for_each_dev(&cxl_bus_type, NULL, NULL, cxl_rescan_attach);
2092
}
2093
2094
void cxl_bus_rescan(void)
2095
{
2096
static DECLARE_WORK(rescan_work, cxl_bus_rescan_queue);
2097
2098
queue_work(cxl_bus_wq, &rescan_work);
2099
}
2100
EXPORT_SYMBOL_NS_GPL(cxl_bus_rescan, "CXL");
2101
2102
void cxl_bus_drain(void)
2103
{
2104
drain_workqueue(cxl_bus_wq);
2105
}
2106
EXPORT_SYMBOL_NS_GPL(cxl_bus_drain, "CXL");
2107
2108
bool schedule_cxl_memdev_detach(struct cxl_memdev *cxlmd)
2109
{
2110
return queue_work(cxl_bus_wq, &cxlmd->detach_work);
2111
}
2112
EXPORT_SYMBOL_NS_GPL(schedule_cxl_memdev_detach, "CXL");
2113
2114
static void add_latency(struct access_coordinate *c, long latency)
2115
{
2116
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2117
c[i].write_latency += latency;
2118
c[i].read_latency += latency;
2119
}
2120
}
2121
2122
static bool coordinates_valid(struct access_coordinate *c)
2123
{
2124
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2125
if (c[i].read_bandwidth && c[i].write_bandwidth &&
2126
c[i].read_latency && c[i].write_latency)
2127
continue;
2128
return false;
2129
}
2130
2131
return true;
2132
}
2133
2134
static void set_min_bandwidth(struct access_coordinate *c, unsigned int bw)
2135
{
2136
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2137
c[i].write_bandwidth = min(c[i].write_bandwidth, bw);
2138
c[i].read_bandwidth = min(c[i].read_bandwidth, bw);
2139
}
2140
}
2141
2142
static void set_access_coordinates(struct access_coordinate *out,
2143
struct access_coordinate *in)
2144
{
2145
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++)
2146
out[i] = in[i];
2147
}
2148
2149
static bool parent_port_is_cxl_root(struct cxl_port *port)
2150
{
2151
return is_cxl_root(to_cxl_port(port->dev.parent));
2152
}
2153
2154
/**
2155
* cxl_endpoint_get_perf_coordinates - Retrieve performance numbers stored in dports
2156
* of CXL path
2157
* @port: endpoint cxl_port
2158
* @coord: output performance data
2159
*
2160
* Return: errno on failure, 0 on success.
2161
*/
2162
int cxl_endpoint_get_perf_coordinates(struct cxl_port *port,
2163
struct access_coordinate *coord)
2164
{
2165
struct cxl_memdev *cxlmd = to_cxl_memdev(port->uport_dev);
2166
struct access_coordinate c[] = {
2167
{
2168
.read_bandwidth = UINT_MAX,
2169
.write_bandwidth = UINT_MAX,
2170
},
2171
{
2172
.read_bandwidth = UINT_MAX,
2173
.write_bandwidth = UINT_MAX,
2174
},
2175
};
2176
struct cxl_port *iter = port;
2177
struct cxl_dport *dport;
2178
struct pci_dev *pdev;
2179
struct device *dev;
2180
unsigned int bw;
2181
bool is_cxl_root;
2182
2183
if (!is_cxl_endpoint(port))
2184
return -EINVAL;
2185
2186
/*
2187
* Skip calculation for RCD. Expectation is HMAT already covers RCD case
2188
* since RCH does not support hotplug.
2189
*/
2190
if (cxlmd->cxlds->rcd)
2191
return 0;
2192
2193
/*
2194
* Exit the loop when the parent port of the current iter port is cxl
2195
* root. The iterative loop starts at the endpoint and gathers the
2196
* latency of the CXL link from the current device/port to the connected
2197
* downstream port each iteration.
2198
*/
2199
do {
2200
dport = iter->parent_dport;
2201
iter = to_cxl_port(iter->dev.parent);
2202
is_cxl_root = parent_port_is_cxl_root(iter);
2203
2204
/*
2205
* There's no valid access_coordinate for a root port since RPs do not
2206
* have CDAT and therefore needs to be skipped.
2207
*/
2208
if (!is_cxl_root) {
2209
if (!coordinates_valid(dport->coord))
2210
return -EINVAL;
2211
cxl_coordinates_combine(c, c, dport->coord);
2212
}
2213
add_latency(c, dport->link_latency);
2214
} while (!is_cxl_root);
2215
2216
dport = iter->parent_dport;
2217
/* Retrieve HB coords */
2218
if (!coordinates_valid(dport->coord))
2219
return -EINVAL;
2220
cxl_coordinates_combine(c, c, dport->coord);
2221
2222
dev = port->uport_dev->parent;
2223
if (!dev_is_pci(dev))
2224
return -ENODEV;
2225
2226
/* Get the calculated PCI paths bandwidth */
2227
pdev = to_pci_dev(dev);
2228
bw = pcie_bandwidth_available(pdev, NULL, NULL, NULL);
2229
if (bw == 0)
2230
return -ENXIO;
2231
bw /= BITS_PER_BYTE;
2232
2233
set_min_bandwidth(c, bw);
2234
set_access_coordinates(coord, c);
2235
2236
return 0;
2237
}
2238
EXPORT_SYMBOL_NS_GPL(cxl_endpoint_get_perf_coordinates, "CXL");
2239
2240
int cxl_port_get_switch_dport_bandwidth(struct cxl_port *port,
2241
struct access_coordinate *c)
2242
{
2243
struct cxl_dport *dport = port->parent_dport;
2244
2245
/* Check this port is connected to a switch DSP and not an RP */
2246
if (parent_port_is_cxl_root(to_cxl_port(port->dev.parent)))
2247
return -ENODEV;
2248
2249
if (!coordinates_valid(dport->coord))
2250
return -EINVAL;
2251
2252
for (int i = 0; i < ACCESS_COORDINATE_MAX; i++) {
2253
c[i].read_bandwidth = dport->coord[i].read_bandwidth;
2254
c[i].write_bandwidth = dport->coord[i].write_bandwidth;
2255
}
2256
2257
return 0;
2258
}
2259
2260
/* for user tooling to ensure port disable work has completed */
2261
static ssize_t flush_store(const struct bus_type *bus, const char *buf, size_t count)
2262
{
2263
if (sysfs_streq(buf, "1")) {
2264
flush_workqueue(cxl_bus_wq);
2265
return count;
2266
}
2267
2268
return -EINVAL;
2269
}
2270
2271
static BUS_ATTR_WO(flush);
2272
2273
static struct attribute *cxl_bus_attributes[] = {
2274
&bus_attr_flush.attr,
2275
NULL,
2276
};
2277
2278
static struct attribute_group cxl_bus_attribute_group = {
2279
.attrs = cxl_bus_attributes,
2280
};
2281
2282
static const struct attribute_group *cxl_bus_attribute_groups[] = {
2283
&cxl_bus_attribute_group,
2284
NULL,
2285
};
2286
2287
const struct bus_type cxl_bus_type = {
2288
.name = "cxl",
2289
.uevent = cxl_bus_uevent,
2290
.match = cxl_bus_match,
2291
.probe = cxl_bus_probe,
2292
.remove = cxl_bus_remove,
2293
.bus_groups = cxl_bus_attribute_groups,
2294
};
2295
EXPORT_SYMBOL_NS_GPL(cxl_bus_type, "CXL");
2296
2297
static struct dentry *cxl_debugfs;
2298
2299
struct dentry *cxl_debugfs_create_dir(const char *dir)
2300
{
2301
return debugfs_create_dir(dir, cxl_debugfs);
2302
}
2303
EXPORT_SYMBOL_NS_GPL(cxl_debugfs_create_dir, "CXL");
2304
2305
static __init int cxl_core_init(void)
2306
{
2307
int rc;
2308
2309
cxl_debugfs = debugfs_create_dir("cxl", NULL);
2310
2311
if (einj_cxl_is_initialized())
2312
debugfs_create_file("einj_types", 0400, cxl_debugfs, NULL,
2313
&einj_cxl_available_error_type_fops);
2314
2315
cxl_mbox_init();
2316
2317
rc = cxl_memdev_init();
2318
if (rc)
2319
return rc;
2320
2321
cxl_bus_wq = alloc_ordered_workqueue("cxl_port", 0);
2322
if (!cxl_bus_wq) {
2323
rc = -ENOMEM;
2324
goto err_wq;
2325
}
2326
2327
rc = bus_register(&cxl_bus_type);
2328
if (rc)
2329
goto err_bus;
2330
2331
rc = cxl_region_init();
2332
if (rc)
2333
goto err_region;
2334
2335
rc = cxl_ras_init();
2336
if (rc)
2337
goto err_ras;
2338
2339
return 0;
2340
2341
err_ras:
2342
cxl_region_exit();
2343
err_region:
2344
bus_unregister(&cxl_bus_type);
2345
err_bus:
2346
destroy_workqueue(cxl_bus_wq);
2347
err_wq:
2348
cxl_memdev_exit();
2349
return rc;
2350
}
2351
2352
static void cxl_core_exit(void)
2353
{
2354
cxl_ras_exit();
2355
cxl_region_exit();
2356
bus_unregister(&cxl_bus_type);
2357
destroy_workqueue(cxl_bus_wq);
2358
cxl_memdev_exit();
2359
debugfs_remove_recursive(cxl_debugfs);
2360
}
2361
2362
subsys_initcall(cxl_core_init);
2363
module_exit(cxl_core_exit);
2364
MODULE_DESCRIPTION("CXL: Core Compute Express Link support");
2365
MODULE_LICENSE("GPL v2");
2366
MODULE_IMPORT_NS("CXL");
2367
2368