1// SPDX-License-Identifier: GPL-2.0
2// Copyright (C) 2025 Arm Ltd.
3
4#define pr_fmt(fmt) "%s:%s: " fmt, KBUILD_MODNAME, __func__
5
6#include <linux/acpi.h>
7#include <linux/atomic.h>
8#include <linux/arm_mpam.h>
9#include <linux/bitfield.h>
10#include <linux/bitmap.h>
11#include <linux/cacheinfo.h>
12#include <linux/cpu.h>
13#include <linux/cpumask.h>
14#include <linux/device.h>
15#include <linux/errno.h>
16#include <linux/gfp.h>
17#include <linux/interrupt.h>
18#include <linux/irq.h>
19#include <linux/irqdesc.h>
20#include <linux/list.h>
21#include <linux/lockdep.h>
22#include <linux/mutex.h>
23#include <linux/platform_device.h>
24#include <linux/printk.h>
25#include <linux/srcu.h>
26#include <linux/spinlock.h>
27#include <linux/types.h>
28#include <linux/workqueue.h>
29
30#include "mpam_internal.h"
31
32DEFINE_STATIC_KEY_FALSE(mpam_enabled); /* This moves to arch code */
33
34/*
35 * mpam_list_lock protects the SRCU lists when writing. Once the
36 * mpam_enabled key is enabled these lists are read-only,
37 * unless the error interrupt disables the driver.
38 */
39static DEFINE_MUTEX(mpam_list_lock);
40static LIST_HEAD(mpam_all_msc);
41
42struct srcu_struct mpam_srcu;
43
44/*
45 * Number of MSCs that have been probed. Once all MSCs have been probed MPAM
46 * can be enabled.
47 */
48static atomic_t mpam_num_msc;
49
50static int mpam_cpuhp_state;
51static DEFINE_MUTEX(mpam_cpuhp_state_lock);
52
53/*
54 * The smallest common values for any CPU or MSC in the system.
55 * Generating traffic outside this range will result in screaming interrupts.
56 */
57u16 mpam_partid_max;
58u8 mpam_pmg_max;
59static bool partid_max_init, partid_max_published;
60static DEFINE_SPINLOCK(partid_max_lock);
61
62/*
63 * mpam is enabled once all devices have been probed from CPU online callbacks,
64 * scheduled via this work_struct. If access to an MSC depends on a CPU that
65 * was not brought online at boot, this can happen surprisingly late.
66 */
67static DECLARE_WORK(mpam_enable_work, &mpam_enable);
68
69/*
70 * All mpam error interrupts indicate a software bug. On receipt, disable the
71 * driver.
72 */
73static DECLARE_WORK(mpam_broken_work, &mpam_disable);
74
76/* The reason mpam was disabled, printed to aid debugging */
76static char *mpam_disable_reason;
77
78/*
79 * An MSC is a physical container for controls and monitors, each identified by
80 * its RIS index. These share a base-address, interrupts and some MMIO
81 * registers. A vMSC is a virtual container for RIS in an MSC that control or
82 * monitor the same thing. Members of a vMSC are all RIS in the same MSC, but
83 * not all RIS in an MSC share a vMSC.
84 *
85 * Components are a group of vMSC that control or monitor the same thing but
86 * are from different MSC, so have different base-address, interrupts etc.
87 * Classes are the set of components of the same type.
88 *
89 * The features of a vMSC are the union of the RIS it contains.
90 * The features of a Class and Component are the common subset of the vMSC
91 * they contain.
92 *
93 * e.g. The system cache may have bandwidth controls on multiple interfaces,
94 * for regulating traffic from devices independently of traffic from CPUs.
95 * If these are two RIS in one MSC, they will be treated as controlling
96 * different things, and will not share a vMSC/component/class.
97 *
98 * e.g. The L2 may have one MSC and two RIS, one for cache-controls another
99 * for bandwidth. These two RIS are members of the same vMSC.
100 *
101 * e.g. The set of RIS that make up the L2 are grouped as a component. These
102 * are sometimes termed slices. They should be configured the same, as if there
103 * were only one.
104 *
105 * e.g. The SoC probably has more than one L2, each attached to a distinct set
106 * of CPUs. All the L2 components are grouped as a class.
107 *
108 * When creating an MSC, struct mpam_msc is added to the mpam_all_msc list,
109 * then linked via struct mpam_ris to a vmsc, component and class.
110 * The same MSC may exist under different class->component->vmsc paths, but the
111 * RIS index will be unique.
112 */
113LIST_HEAD(mpam_classes);
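
/*
 * Illustrative sketch only (not used by the driver): how the hierarchy
 * described above is typically walked under SRCU, from class down to each
 * RIS. The list heads and member names match the structures used below.
 *
 *	struct mpam_class *class;
 *	struct mpam_component *comp;
 *	struct mpam_vmsc *vmsc;
 *	struct mpam_msc_ris *ris;
 *
 *	guard(srcu)(&mpam_srcu);
 *	list_for_each_entry_srcu(class, &mpam_classes, classes_list,
 *				 srcu_read_lock_held(&mpam_srcu))
 *		list_for_each_entry_srcu(comp, &class->components, class_list,
 *					 srcu_read_lock_held(&mpam_srcu))
 *			list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
 *						 srcu_read_lock_held(&mpam_srcu))
 *				list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
 *							 srcu_read_lock_held(&mpam_srcu))
 *					;	- each RIS is reached exactly once
 */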
114
115/* List of all objects that can be free()d after synchronize_srcu() */
116static LLIST_HEAD(mpam_garbage);
117
118static inline void init_garbage(struct mpam_garbage *garbage)
119{
120 init_llist_node(&garbage->llist);
121}
122
123#define add_to_garbage(x) \
124do { \
125 __typeof__(x) _x = (x); \
126 _x->garbage.to_free = _x; \
127 llist_add(&_x->garbage.llist, &mpam_garbage); \
128} while (0)
129
130static void mpam_free_garbage(void)
131{
132 struct mpam_garbage *iter, *tmp;
133 struct llist_node *to_free = llist_del_all(&mpam_garbage);
134
135 if (!to_free)
136 return;
137
138 synchronize_srcu(&mpam_srcu);
139
140 llist_for_each_entry_safe(iter, tmp, to_free, llist) {
141 if (iter->pdev)
142 devm_kfree(&iter->pdev->dev, iter->to_free);
143 else
144 kfree(iter->to_free);
145 }
146}
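
/*
 * A sketch of the intended usage pattern; "obj" and "some_list" are
 * placeholders (mpam_msc_drv_remove() below is a real example):
 *
 *	mutex_lock(&mpam_list_lock);
 *	list_del_rcu(&obj->some_list);
 *	add_to_garbage(obj);
 *	mutex_unlock(&mpam_list_lock);
 *
 *	mpam_free_garbage();
 *
 * mpam_free_garbage() waits for existing SRCU readers before the memory is
 * passed to kfree()/devm_kfree().
 */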
147
148/*
149 * Once mpam is enabled, new requestors cannot further reduce the available
150 * partid. Assert that the size is fixed, and new requestors will be turned
151 * away.
152 */
153static void mpam_assert_partid_sizes_fixed(void)
154{
155 WARN_ON_ONCE(!partid_max_published);
156}
157
158static u32 __mpam_read_reg(struct mpam_msc *msc, u16 reg)
159{
160 WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(), &msc->accessibility));
161
162 return readl_relaxed(msc->mapped_hwpage + reg);
163}
164
165static inline u32 _mpam_read_partsel_reg(struct mpam_msc *msc, u16 reg)
166{
167 lockdep_assert_held_once(&msc->part_sel_lock);
168 return __mpam_read_reg(msc, reg);
169}
170
171#define mpam_read_partsel_reg(msc, reg) _mpam_read_partsel_reg(msc, MPAMF_##reg)
172
173static void __mpam_write_reg(struct mpam_msc *msc, u16 reg, u32 val)
174{
175 WARN_ON_ONCE(reg + sizeof(u32) > msc->mapped_hwpage_sz);
176 WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(), &msc->accessibility));
177
178 writel_relaxed(val, msc->mapped_hwpage + reg);
179}
180
181static inline void _mpam_write_partsel_reg(struct mpam_msc *msc, u16 reg, u32 val)
182{
183 lockdep_assert_held_once(&msc->part_sel_lock);
184 __mpam_write_reg(msc, reg, val);
185}
186
187#define mpam_write_partsel_reg(msc, reg, val) _mpam_write_partsel_reg(msc, MPAMCFG_##reg, val)
188
189static inline u32 _mpam_read_monsel_reg(struct mpam_msc *msc, u16 reg)
190{
191 mpam_mon_sel_lock_held(msc);
192 return __mpam_read_reg(msc, reg);
193}
194
195#define mpam_read_monsel_reg(msc, reg) _mpam_read_monsel_reg(msc, MSMON_##reg)
196
197static inline void _mpam_write_monsel_reg(struct mpam_msc *msc, u16 reg, u32 val)
198{
199 mpam_mon_sel_lock_held(msc);
200 __mpam_write_reg(msc, reg, val);
201}
202
203#define mpam_write_monsel_reg(msc, reg, val) _mpam_write_monsel_reg(msc, MSMON_##reg, val)
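
/*
 * For reference, the accessor macros above only paste the register-bank
 * prefix onto the register name, e.g.:
 *	mpam_read_partsel_reg(msc, CPOR_IDR)	reads  MPAMF_CPOR_IDR
 *	mpam_write_partsel_reg(msc, CPBM, val)	writes MPAMCFG_CPBM
 *	mpam_read_monsel_reg(msc, CSU)		reads  MSMON_CSU
 * The _mpam_*() helpers additionally assert that the relevant sel lock is
 * held.
 */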
204
205static u64 mpam_msc_read_idr(struct mpam_msc *msc)
206{
207 u64 idr_high = 0, idr_low;
208
209 lockdep_assert_held(&msc->part_sel_lock);
210
211 idr_low = mpam_read_partsel_reg(msc, IDR);
212 if (FIELD_GET(MPAMF_IDR_EXT, idr_low))
213 idr_high = mpam_read_partsel_reg(msc, IDR + 4);
214
215 return (idr_high << 32) | idr_low;
216}
217
218static void mpam_msc_clear_esr(struct mpam_msc *msc)
219{
220 u64 esr_low = __mpam_read_reg(msc, MPAMF_ESR);
221
222 if (!esr_low)
223 return;
224
225 /*
226 * Clearing the high/low bits of MPAMF_ESR cannot be atomic.
227 * Clear the top half first, so that the pending error bits in the
228 * lower half prevent hardware from updating either half of the
229 * register.
230 */
231 if (msc->has_extd_esr)
232 __mpam_write_reg(msc, MPAMF_ESR + 4, 0);
233 __mpam_write_reg(msc, MPAMF_ESR, 0);
234}
235
236static u64 mpam_msc_read_esr(struct mpam_msc *msc)
237{
238 u64 esr_high = 0, esr_low;
239
240 esr_low = __mpam_read_reg(msc, MPAMF_ESR);
241 if (msc->has_extd_esr)
242 esr_high = __mpam_read_reg(msc, MPAMF_ESR + 4);
243
244 return (esr_high << 32) | esr_low;
245}
246
247static void __mpam_part_sel_raw(u32 partsel, struct mpam_msc *msc)
248{
249 lockdep_assert_held(&msc->part_sel_lock);
250
251 mpam_write_partsel_reg(msc, PART_SEL, partsel);
252}
253
254static void __mpam_part_sel(u8 ris_idx, u16 partid, struct mpam_msc *msc)
255{
256 u32 partsel = FIELD_PREP(MPAMCFG_PART_SEL_RIS, ris_idx) |
257 FIELD_PREP(MPAMCFG_PART_SEL_PARTID_SEL, partid);
258
259 __mpam_part_sel_raw(partsel, msc);
260}
261
262static void __mpam_intpart_sel(u8 ris_idx, u16 intpartid, struct mpam_msc *msc)
263{
264 u32 partsel = FIELD_PREP(MPAMCFG_PART_SEL_RIS, ris_idx) |
265 FIELD_PREP(MPAMCFG_PART_SEL_PARTID_SEL, intpartid) |
266 MPAMCFG_PART_SEL_INTERNAL;
267
268 __mpam_part_sel_raw(partsel, msc);
269}
270
271int mpam_register_requestor(u16 partid_max, u8 pmg_max)
272{
273 guard(spinlock)(&partid_max_lock);
274 if (!partid_max_init) {
275 mpam_partid_max = partid_max;
276 mpam_pmg_max = pmg_max;
277 partid_max_init = true;
278 } else if (!partid_max_published) {
279 mpam_partid_max = min(mpam_partid_max, partid_max);
280 mpam_pmg_max = min(mpam_pmg_max, pmg_max);
281 } else {
282 /* New requestors can't lower the values */
283 if (partid_max < mpam_partid_max || pmg_max < mpam_pmg_max)
284 return -EBUSY;
285 }
286
287 return 0;
288}
289EXPORT_SYMBOL(mpam_register_requestor);
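
/*
 * A hypothetical requestor (for example, arch code that has read its MPAM ID
 * registers) registers the widths it supports before MPAM is enabled. The
 * values below are illustrative only:
 *
 *	u16 my_partid_max = 63;
 *	u8 my_pmg_max = 3;
 *
 *	err = mpam_register_requestor(my_partid_max, my_pmg_max);
 *
 * A non-zero return (-EBUSY) means the system-wide values have already been
 * published and a requestor supporting fewer partid/pmg cannot be
 * accommodated.
 */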
290
291static struct mpam_class *
292mpam_class_alloc(u8 level_idx, enum mpam_class_types type)
293{
294 struct mpam_class *class;
295
296 lockdep_assert_held(&mpam_list_lock);
297
298 class = kzalloc(sizeof(*class), GFP_KERNEL);
299 if (!class)
300 return ERR_PTR(-ENOMEM);
301 init_garbage(&class->garbage);
302
303 INIT_LIST_HEAD_RCU(&class->components);
304 /* Affinity is updated when ris are added */
305 class->level = level_idx;
306 class->type = type;
307 INIT_LIST_HEAD_RCU(&class->classes_list);
308 ida_init(&class->ida_csu_mon);
309 ida_init(&class->ida_mbwu_mon);
310
311 list_add_rcu(&class->classes_list, &mpam_classes);
312
313 return class;
314}
315
316static void mpam_class_destroy(struct mpam_class *class)
317{
318 lockdep_assert_held(&mpam_list_lock);
319
320 list_del_rcu(&class->classes_list);
321 add_to_garbage(class);
322}
323
324static struct mpam_class *
325mpam_class_find(u8 level_idx, enum mpam_class_types type)
326{
327 struct mpam_class *class;
328
329 lockdep_assert_held(&mpam_list_lock);
330
331 list_for_each_entry(class, &mpam_classes, classes_list) {
332 if (class->type == type && class->level == level_idx)
333 return class;
334 }
335
336 return mpam_class_alloc(level_idx, type);
337}
338
339static struct mpam_component *
340mpam_component_alloc(struct mpam_class *class, int id)
341{
342 struct mpam_component *comp;
343
344 lockdep_assert_held(&mpam_list_lock);
345
346 comp = kzalloc(sizeof(*comp), GFP_KERNEL);
347 if (!comp)
348 return ERR_PTR(-ENOMEM);
349 init_garbage(&comp->garbage);
350
351 comp->comp_id = id;
352 INIT_LIST_HEAD_RCU(&comp->vmsc);
353 /* Affinity is updated when RIS are added */
354 INIT_LIST_HEAD_RCU(&comp->class_list);
355 comp->class = class;
356
357 list_add_rcu(&comp->class_list, &class->components);
358
359 return comp;
360}
361
362static void __destroy_component_cfg(struct mpam_component *comp);
363
364static void mpam_component_destroy(struct mpam_component *comp)
365{
366 struct mpam_class *class = comp->class;
367
368 lockdep_assert_held(&mpam_list_lock);
369
370 __destroy_component_cfg(comp);
371
372 list_del_rcu(&comp->class_list);
373 add_to_garbage(comp);
374
375 if (list_empty(&class->components))
376 mpam_class_destroy(class);
377}
378
379static struct mpam_component *
380mpam_component_find(struct mpam_class *class, int id)
381{
382 struct mpam_component *comp;
383
384 lockdep_assert_held(&mpam_list_lock);
385
386 list_for_each_entry(comp, &class->components, class_list) {
387 if (comp->comp_id == id)
388 return comp;
389 }
390
391 return mpam_component_alloc(class, id);
392}
393
394static struct mpam_vmsc *
395mpam_vmsc_alloc(struct mpam_component *comp, struct mpam_msc *msc)
396{
397 struct mpam_vmsc *vmsc;
398
399 lockdep_assert_held(&mpam_list_lock);
400
401 vmsc = kzalloc(sizeof(*vmsc), GFP_KERNEL);
402 if (!vmsc)
403 return ERR_PTR(-ENOMEM);
404 init_garbage(&vmsc->garbage);
405
406 INIT_LIST_HEAD_RCU(&vmsc->ris);
407 INIT_LIST_HEAD_RCU(&vmsc->comp_list);
408 vmsc->comp = comp;
409 vmsc->msc = msc;
410
411 list_add_rcu(&vmsc->comp_list, &comp->vmsc);
412
413 return vmsc;
414}
415
416static void mpam_vmsc_destroy(struct mpam_vmsc *vmsc)
417{
418 struct mpam_component *comp = vmsc->comp;
419
420 lockdep_assert_held(&mpam_list_lock);
421
422 list_del_rcu(&vmsc->comp_list);
423 add_to_garbage(vmsc);
424
425 if (list_empty(&comp->vmsc))
426 mpam_component_destroy(comp);
427}
428
429static struct mpam_vmsc *
430mpam_vmsc_find(struct mpam_component *comp, struct mpam_msc *msc)
431{
432 struct mpam_vmsc *vmsc;
433
434 lockdep_assert_held(&mpam_list_lock);
435
436 list_for_each_entry(vmsc, &comp->vmsc, comp_list) {
437 if (vmsc->msc->id == msc->id)
438 return vmsc;
439 }
440
441 return mpam_vmsc_alloc(comp, msc);
442}
443
444/*
445 * The cacheinfo structures are only populated when CPUs are online.
446 * This helper walks the acpi tables to include offline CPUs too.
447 */
448int mpam_get_cpumask_from_cache_id(unsigned long cache_id, u32 cache_level,
449 cpumask_t *affinity)
450{
451 return acpi_pptt_get_cpumask_from_cache_id(cache_id, affinity);
452}
453
454/*
455 * cpumask_of_node() only knows about online CPUs, so it can't tell us whether
456 * a class is represented on all possible CPUs.
457 */
458static void get_cpumask_from_node_id(u32 node_id, cpumask_t *affinity)
459{
460 int cpu;
461
462 for_each_possible_cpu(cpu) {
463 if (node_id == cpu_to_node(cpu))
464 cpumask_set_cpu(cpu, affinity);
465 }
466}
467
468static int mpam_ris_get_affinity(struct mpam_msc *msc, cpumask_t *affinity,
469 enum mpam_class_types type,
470 struct mpam_class *class,
471 struct mpam_component *comp)
472{
473 int err;
474
475 switch (type) {
476 case MPAM_CLASS_CACHE:
477 err = mpam_get_cpumask_from_cache_id(comp->comp_id, class->level,
478 affinity);
479 if (err) {
480 dev_warn_once(&msc->pdev->dev,
481 "Failed to determine CPU affinity\n");
482 return err;
483 }
484
485 if (cpumask_empty(affinity))
486 dev_warn_once(&msc->pdev->dev, "no CPUs associated with cache node\n");
487
488 break;
489 case MPAM_CLASS_MEMORY:
490 get_cpumask_from_node_id(comp->comp_id, affinity);
491 /* affinity may be empty for CPU-less memory nodes */
492 break;
493 case MPAM_CLASS_UNKNOWN:
494 return 0;
495 }
496
497 cpumask_and(affinity, affinity, &msc->accessibility);
498
499 return 0;
500}
501
502static int mpam_ris_create_locked(struct mpam_msc *msc, u8 ris_idx,
503 enum mpam_class_types type, u8 class_id,
504 int component_id)
505{
506 int err;
507 struct mpam_vmsc *vmsc;
508 struct mpam_msc_ris *ris;
509 struct mpam_class *class;
510 struct mpam_component *comp;
511 struct platform_device *pdev = msc->pdev;
512
513 lockdep_assert_held(&mpam_list_lock);
514
515 if (ris_idx >= MPAM_MSC_MAX_NUM_RIS)
516 return -EINVAL;
517
518 if (test_and_set_bit(ris_idx, &msc->ris_idxs))
519 return -EBUSY;
520
521 ris = devm_kzalloc(&msc->pdev->dev, sizeof(*ris), GFP_KERNEL);
522 if (!ris)
523 return -ENOMEM;
524 init_garbage(&ris->garbage);
525 ris->garbage.pdev = pdev;
526
527 class = mpam_class_find(class_id, type);
528 if (IS_ERR(class))
529 return PTR_ERR(class);
530
531 comp = mpam_component_find(class, component_id);
532 if (IS_ERR(comp)) {
533 if (list_empty(&class->components))
534 mpam_class_destroy(class);
535 return PTR_ERR(comp);
536 }
537
538 vmsc = mpam_vmsc_find(comp, msc);
539 if (IS_ERR(vmsc)) {
540 if (list_empty(&comp->vmsc))
541 mpam_component_destroy(comp);
542 return PTR_ERR(vmsc);
543 }
544
545 err = mpam_ris_get_affinity(msc, &ris->affinity, type, class, comp);
546 if (err) {
547 if (list_empty(&vmsc->ris))
548 mpam_vmsc_destroy(vmsc);
549 return err;
550 }
551
552 ris->ris_idx = ris_idx;
553 INIT_LIST_HEAD_RCU(&ris->msc_list);
554 INIT_LIST_HEAD_RCU(&ris->vmsc_list);
555 ris->vmsc = vmsc;
556
557 cpumask_or(&comp->affinity, &comp->affinity, &ris->affinity);
558 cpumask_or(&class->affinity, &class->affinity, &ris->affinity);
559 list_add_rcu(&ris->vmsc_list, &vmsc->ris);
560 list_add_rcu(&ris->msc_list, &msc->ris);
561
562 return 0;
563}
564
565static void mpam_ris_destroy(struct mpam_msc_ris *ris)
566{
567 struct mpam_vmsc *vmsc = ris->vmsc;
568 struct mpam_msc *msc = vmsc->msc;
569 struct mpam_component *comp = vmsc->comp;
570 struct mpam_class *class = comp->class;
571
572 lockdep_assert_held(&mpam_list_lock);
573
574 /*
575 * It is assumed affinities don't overlap. If they do the class becomes
576 * unusable immediately.
577 */
578 cpumask_andnot(&class->affinity, &class->affinity, &ris->affinity);
579 cpumask_andnot(&comp->affinity, &comp->affinity, &ris->affinity);
580 clear_bit(ris->ris_idx, &msc->ris_idxs);
581 list_del_rcu(&ris->msc_list);
582 list_del_rcu(&ris->vmsc_list);
583 add_to_garbage(ris);
584
585 if (list_empty(&vmsc->ris))
586 mpam_vmsc_destroy(vmsc);
587}
588
589int mpam_ris_create(struct mpam_msc *msc, u8 ris_idx,
590 enum mpam_class_types type, u8 class_id, int component_id)
591{
592 int err;
593
594 mutex_lock(&mpam_list_lock);
595 err = mpam_ris_create_locked(msc, ris_idx, type, class_id,
596 component_id);
597 mutex_unlock(&mpam_list_lock);
598 if (err)
599 mpam_free_garbage();
600
601 return err;
602}
603
604static struct mpam_msc_ris *mpam_get_or_create_ris(struct mpam_msc *msc,
605 u8 ris_idx)
606{
607 int err;
608 struct mpam_msc_ris *ris;
609
610 lockdep_assert_held(&mpam_list_lock);
611
612 if (!test_bit(ris_idx, &msc->ris_idxs)) {
613 err = mpam_ris_create_locked(msc, ris_idx, MPAM_CLASS_UNKNOWN,
614 0, 0);
615 if (err)
616 return ERR_PTR(err);
617 }
618
619 list_for_each_entry(ris, &msc->ris, msc_list) {
620 if (ris->ris_idx == ris_idx)
621 return ris;
622 }
623
624 return ERR_PTR(-ENOENT);
625}
626
627/*
628 * IHI009A.a has this nugget: "If a monitor does not support automatic behaviour
629 * of NRDY, software can use this bit for any purpose" - so hardware might not
630 * implement this - but it isn't RES0.
631 *
632 * Try and see what values stick in this bit. If we can write either value,
633 * it's probably not implemented by hardware.
634 */
635static bool _mpam_ris_hw_probe_hw_nrdy(struct mpam_msc_ris *ris, u32 mon_reg)
636{
637 u32 now;
638 u64 mon_sel;
639 bool can_set, can_clear;
640 struct mpam_msc *msc = ris->vmsc->msc;
641
642 if (WARN_ON_ONCE(!mpam_mon_sel_lock(msc)))
643 return false;
644
645 mon_sel = FIELD_PREP(MSMON_CFG_MON_SEL_MON_SEL, 0) |
646 FIELD_PREP(MSMON_CFG_MON_SEL_RIS, ris->ris_idx);
647 _mpam_write_monsel_reg(msc, mon_reg, mon_sel);
648
649 _mpam_write_monsel_reg(msc, mon_reg, MSMON___NRDY);
650 now = _mpam_read_monsel_reg(msc, mon_reg);
651 can_set = now & MSMON___NRDY;
652
653 _mpam_write_monsel_reg(msc, mon_reg, 0);
654 now = _mpam_read_monsel_reg(msc, mon_reg);
655 can_clear = !(now & MSMON___NRDY);
656 mpam_mon_sel_unlock(msc);
657
658 return (!can_set || !can_clear);
659}
660
661#define mpam_ris_hw_probe_hw_nrdy(_ris, _mon_reg) \
662 _mpam_ris_hw_probe_hw_nrdy(_ris, MSMON_##_mon_reg)
663
664static void mpam_ris_hw_probe(struct mpam_msc_ris *ris)
665{
666 int err;
667 struct mpam_msc *msc = ris->vmsc->msc;
668 struct device *dev = &msc->pdev->dev;
669 struct mpam_props *props = &ris->props;
670 struct mpam_class *class = ris->vmsc->comp->class;
671
672 lockdep_assert_held(&msc->probe_lock);
673 lockdep_assert_held(&msc->part_sel_lock);
674
675 /* Cache Capacity Partitioning */
676 if (FIELD_GET(MPAMF_IDR_HAS_CCAP_PART, ris->idr)) {
677 u32 ccap_features = mpam_read_partsel_reg(msc, CCAP_IDR);
678
679 props->cmax_wd = FIELD_GET(MPAMF_CCAP_IDR_CMAX_WD, ccap_features);
680 if (props->cmax_wd &&
681 FIELD_GET(MPAMF_CCAP_IDR_HAS_CMAX_SOFTLIM, ccap_features))
682 mpam_set_feature(mpam_feat_cmax_softlim, props);
683
684 if (props->cmax_wd &&
685 !FIELD_GET(MPAMF_CCAP_IDR_NO_CMAX, ccap_features))
686 mpam_set_feature(mpam_feat_cmax_cmax, props);
687
688 if (props->cmax_wd &&
689 FIELD_GET(MPAMF_CCAP_IDR_HAS_CMIN, ccap_features))
690 mpam_set_feature(mpam_feat_cmax_cmin, props);
691
692 props->cassoc_wd = FIELD_GET(MPAMF_CCAP_IDR_CASSOC_WD, ccap_features);
693 if (props->cassoc_wd &&
694 FIELD_GET(MPAMF_CCAP_IDR_HAS_CASSOC, ccap_features))
695 mpam_set_feature(mpam_feat_cmax_cassoc, props);
696 }
697
698 /* Cache Portion partitioning */
699 if (FIELD_GET(MPAMF_IDR_HAS_CPOR_PART, ris->idr)) {
700 u32 cpor_features = mpam_read_partsel_reg(msc, CPOR_IDR);
701
702 props->cpbm_wd = FIELD_GET(MPAMF_CPOR_IDR_CPBM_WD, cpor_features);
703 if (props->cpbm_wd)
704 mpam_set_feature(mpam_feat_cpor_part, props);
705 }
706
707 /* Memory bandwidth partitioning */
708 if (FIELD_GET(MPAMF_IDR_HAS_MBW_PART, ris->idr)) {
709 u32 mbw_features = mpam_read_partsel_reg(msc, MBW_IDR);
710
711 /* portion bitmap resolution */
712 props->mbw_pbm_bits = FIELD_GET(MPAMF_MBW_IDR_BWPBM_WD, mbw_features);
713 if (props->mbw_pbm_bits &&
714 FIELD_GET(MPAMF_MBW_IDR_HAS_PBM, mbw_features))
715 mpam_set_feature(mpam_feat_mbw_part, props);
716
717 props->bwa_wd = FIELD_GET(MPAMF_MBW_IDR_BWA_WD, mbw_features);
718 if (props->bwa_wd && FIELD_GET(MPAMF_MBW_IDR_HAS_MAX, mbw_features))
719 mpam_set_feature(mpam_feat_mbw_max, props);
720
721 if (props->bwa_wd && FIELD_GET(MPAMF_MBW_IDR_HAS_MIN, mbw_features))
722 mpam_set_feature(mpam_feat_mbw_min, props);
723
724 if (props->bwa_wd && FIELD_GET(MPAMF_MBW_IDR_HAS_PROP, mbw_features))
725 mpam_set_feature(mpam_feat_mbw_prop, props);
726 }
727
728 /* Priority partitioning */
729 if (FIELD_GET(MPAMF_IDR_HAS_PRI_PART, ris->idr)) {
730 u32 pri_features = mpam_read_partsel_reg(msc, PRI_IDR);
731
732 props->intpri_wd = FIELD_GET(MPAMF_PRI_IDR_INTPRI_WD, pri_features);
733 if (props->intpri_wd && FIELD_GET(MPAMF_PRI_IDR_HAS_INTPRI, pri_features)) {
734 mpam_set_feature(mpam_feat_intpri_part, props);
735 if (FIELD_GET(MPAMF_PRI_IDR_INTPRI_0_IS_LOW, pri_features))
736 mpam_set_feature(mpam_feat_intpri_part_0_low, props);
737 }
738
739 props->dspri_wd = FIELD_GET(MPAMF_PRI_IDR_DSPRI_WD, pri_features);
740 if (props->dspri_wd && FIELD_GET(MPAMF_PRI_IDR_HAS_DSPRI, pri_features)) {
741 mpam_set_feature(mpam_feat_dspri_part, props);
742 if (FIELD_GET(MPAMF_PRI_IDR_DSPRI_0_IS_LOW, pri_features))
743 mpam_set_feature(mpam_feat_dspri_part_0_low, props);
744 }
745 }
746
747 /* Performance Monitoring */
748 if (FIELD_GET(MPAMF_IDR_HAS_MSMON, ris->idr)) {
749 u32 msmon_features = mpam_read_partsel_reg(msc, MSMON_IDR);
750
751 /*
752 * If the firmware max-nrdy-us property is missing, the
753 * CSU counters can't be used. Should we wait forever?
754 */
755 err = device_property_read_u32(&msc->pdev->dev,
756 "arm,not-ready-us",
757 &msc->nrdy_usec);
758
759 if (FIELD_GET(MPAMF_MSMON_IDR_MSMON_CSU, msmon_features)) {
760 u32 csumonidr;
761
762 csumonidr = mpam_read_partsel_reg(msc, CSUMON_IDR);
763 props->num_csu_mon = FIELD_GET(MPAMF_CSUMON_IDR_NUM_MON, csumonidr);
764 if (props->num_csu_mon) {
765 bool hw_managed;
766
767 mpam_set_feature(mpam_feat_msmon_csu, props);
768
769 if (FIELD_GET(MPAMF_CSUMON_IDR_HAS_XCL, csumonidr))
770 mpam_set_feature(mpam_feat_msmon_csu_xcl, props);
771
772 /* Is NRDY hardware managed? */
773 hw_managed = mpam_ris_hw_probe_hw_nrdy(ris, CSU);
774 if (hw_managed)
775 mpam_set_feature(mpam_feat_msmon_csu_hw_nrdy, props);
776 }
777
778 /*
779 * Accept the missing firmware property if NRDY appears
780 * un-implemented.
781 */
782 if (err && mpam_has_feature(mpam_feat_msmon_csu_hw_nrdy, props))
783 dev_err_once(dev, "Counters are not usable because not-ready timeout was not provided by firmware.");
784 }
785 if (FIELD_GET(MPAMF_MSMON_IDR_MSMON_MBWU, msmon_features)) {
786 bool has_long, hw_managed;
787 u32 mbwumon_idr = mpam_read_partsel_reg(msc, MBWUMON_IDR);
788
789 props->num_mbwu_mon = FIELD_GET(MPAMF_MBWUMON_IDR_NUM_MON, mbwumon_idr);
790 if (props->num_mbwu_mon) {
791 mpam_set_feature(mpam_feat_msmon_mbwu, props);
792
793 if (FIELD_GET(MPAMF_MBWUMON_IDR_HAS_RWBW, mbwumon_idr))
794 mpam_set_feature(mpam_feat_msmon_mbwu_rwbw, props);
795
796 has_long = FIELD_GET(MPAMF_MBWUMON_IDR_HAS_LONG, mbwumon_idr);
797 if (has_long) {
798 if (FIELD_GET(MPAMF_MBWUMON_IDR_LWD, mbwumon_idr))
799 mpam_set_feature(mpam_feat_msmon_mbwu_63counter, props);
800 else
801 mpam_set_feature(mpam_feat_msmon_mbwu_44counter, props);
802 } else {
803 mpam_set_feature(mpam_feat_msmon_mbwu_31counter, props);
804 }
805
806 /* Is NRDY hardware managed? */
807 hw_managed = mpam_ris_hw_probe_hw_nrdy(ris, MBWU);
808 if (hw_managed)
809 mpam_set_feature(mpam_feat_msmon_mbwu_hw_nrdy, props);
810
811 /*
812 * Don't warn about any missing firmware property for
813 * MBWU NRDY - it doesn't make any sense!
814 */
815 }
816 }
817 }
818
819 /*
820 * RIS with PARTID narrowing don't have enough storage for one
821 * configuration per PARTID. If these are in a class we could use,
822 * reduce the supported partid_max to match the number of intpartid.
823 * If the class is unknown, just ignore it.
824 */
825 if (FIELD_GET(MPAMF_IDR_HAS_PARTID_NRW, ris->idr) &&
826 class->type != MPAM_CLASS_UNKNOWN) {
827 u32 nrwidr = mpam_read_partsel_reg(msc, PARTID_NRW_IDR);
828 u16 partid_max = FIELD_GET(MPAMF_PARTID_NRW_IDR_INTPARTID_MAX, nrwidr);
829
830 mpam_set_feature(mpam_feat_partid_nrw, props);
831 msc->partid_max = min(msc->partid_max, partid_max);
832 }
833}
834
835static int mpam_msc_hw_probe(struct mpam_msc *msc)
836{
837 u64 idr;
838 u16 partid_max;
839 u8 ris_idx, pmg_max;
840 struct mpam_msc_ris *ris;
841 struct device *dev = &msc->pdev->dev;
842
843 lockdep_assert_held(&msc->probe_lock);
844
845 idr = __mpam_read_reg(msc, MPAMF_AIDR);
846 if ((idr & MPAMF_AIDR_ARCH_MAJOR_REV) != MPAM_ARCHITECTURE_V1) {
847 dev_err_once(dev, "MSC does not match MPAM architecture v1.x\n");
848 return -EIO;
849 }
850
851 /* Grab an IDR value to find out how many RIS there are */
852 mutex_lock(&msc->part_sel_lock);
853 idr = mpam_msc_read_idr(msc);
854 mutex_unlock(&msc->part_sel_lock);
855
856 msc->ris_max = FIELD_GET(MPAMF_IDR_RIS_MAX, idr);
857
858 /* Use these values so partid/pmg always starts with a valid value */
859 msc->partid_max = FIELD_GET(MPAMF_IDR_PARTID_MAX, idr);
860 msc->pmg_max = FIELD_GET(MPAMF_IDR_PMG_MAX, idr);
861
862 for (ris_idx = 0; ris_idx <= msc->ris_max; ris_idx++) {
863 mutex_lock(&msc->part_sel_lock);
864 __mpam_part_sel(ris_idx, 0, msc);
865 idr = mpam_msc_read_idr(msc);
866 mutex_unlock(&msc->part_sel_lock);
867
868 partid_max = FIELD_GET(MPAMF_IDR_PARTID_MAX, idr);
869 pmg_max = FIELD_GET(MPAMF_IDR_PMG_MAX, idr);
870 msc->partid_max = min(msc->partid_max, partid_max);
871 msc->pmg_max = min(msc->pmg_max, pmg_max);
872 msc->has_extd_esr = FIELD_GET(MPAMF_IDR_HAS_EXTD_ESR, idr);
873
874 mutex_lock(&mpam_list_lock);
875 ris = mpam_get_or_create_ris(msc, ris_idx);
876 mutex_unlock(&mpam_list_lock);
877 if (IS_ERR(ris))
878 return PTR_ERR(ris);
879 ris->idr = idr;
880
881 mutex_lock(&msc->part_sel_lock);
882 __mpam_part_sel(ris_idx, 0, msc);
883 mpam_ris_hw_probe(ris);
884 mutex_unlock(&msc->part_sel_lock);
885 }
886
887 /* Clear any stale errors */
888 mpam_msc_clear_esr(msc);
889
890 spin_lock(&partid_max_lock);
891 mpam_partid_max = min(mpam_partid_max, msc->partid_max);
892 mpam_pmg_max = min(mpam_pmg_max, msc->pmg_max);
893 spin_unlock(&partid_max_lock);
894
895 msc->probed = true;
896
897 return 0;
898}
899
900struct mon_read {
901 struct mpam_msc_ris *ris;
902 struct mon_cfg *ctx;
903 enum mpam_device_features type;
904 u64 *val;
905 int err;
906};
907
908static bool mpam_ris_has_mbwu_long_counter(struct mpam_msc_ris *ris)
909{
910 return (mpam_has_feature(mpam_feat_msmon_mbwu_63counter, &ris->props) ||
911 mpam_has_feature(mpam_feat_msmon_mbwu_44counter, &ris->props));
912}
913
914static u64 mpam_msc_read_mbwu_l(struct mpam_msc *msc)
915{
916 int retry = 3;
917 u32 mbwu_l_low;
918 u64 mbwu_l_high1, mbwu_l_high2;
919
920 mpam_mon_sel_lock_held(msc);
921
922 WARN_ON_ONCE((MSMON_MBWU_L + sizeof(u64)) > msc->mapped_hwpage_sz);
923 WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(), &msc->accessibility));
924
925 mbwu_l_high2 = __mpam_read_reg(msc, MSMON_MBWU_L + 4);
926 do {
927 mbwu_l_high1 = mbwu_l_high2;
928 mbwu_l_low = __mpam_read_reg(msc, MSMON_MBWU_L);
929 mbwu_l_high2 = __mpam_read_reg(msc, MSMON_MBWU_L + 4);
930
931 retry--;
932 } while (mbwu_l_high1 != mbwu_l_high2 && retry > 0);
933
934 if (mbwu_l_high1 == mbwu_l_high2)
935 return (mbwu_l_high1 << 32) | mbwu_l_low;
936
937 pr_warn("Failed to read a stable value\n");
938 return MSMON___L_NRDY;
939}
940
941static void mpam_msc_zero_mbwu_l(struct mpam_msc *msc)
942{
943 mpam_mon_sel_lock_held(msc);
944
945 WARN_ON_ONCE((MSMON_MBWU_L + sizeof(u64)) > msc->mapped_hwpage_sz);
946 WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(), &msc->accessibility));
947
948 __mpam_write_reg(msc, MSMON_MBWU_L, 0);
949 __mpam_write_reg(msc, MSMON_MBWU_L + 4, 0);
950}
951
952static void gen_msmon_ctl_flt_vals(struct mon_read *m, u32 *ctl_val,
953 u32 *flt_val)
954{
955 struct mon_cfg *ctx = m->ctx;
956
957 /*
958 * For CSU counters it's implementation-defined what happens when not
959 * filtering by partid.
960 */
961 *ctl_val = MSMON_CFG_x_CTL_MATCH_PARTID;
962
963 *flt_val = FIELD_PREP(MSMON_CFG_x_FLT_PARTID, ctx->partid);
964
965 if (m->ctx->match_pmg) {
966 *ctl_val |= MSMON_CFG_x_CTL_MATCH_PMG;
967 *flt_val |= FIELD_PREP(MSMON_CFG_x_FLT_PMG, ctx->pmg);
968 }
969
970 switch (m->type) {
971 case mpam_feat_msmon_csu:
972 *ctl_val |= MSMON_CFG_CSU_CTL_TYPE_CSU;
973
974 if (mpam_has_feature(mpam_feat_msmon_csu_xcl, &m->ris->props))
975 *flt_val |= FIELD_PREP(MSMON_CFG_CSU_FLT_XCL, ctx->csu_exclude_clean);
976
977 break;
978 case mpam_feat_msmon_mbwu_31counter:
979 case mpam_feat_msmon_mbwu_44counter:
980 case mpam_feat_msmon_mbwu_63counter:
981 *ctl_val |= MSMON_CFG_MBWU_CTL_TYPE_MBWU;
982
983 if (mpam_has_feature(mpam_feat_msmon_mbwu_rwbw, &m->ris->props))
984 *flt_val |= FIELD_PREP(MSMON_CFG_MBWU_FLT_RWBW, ctx->opts);
985
986 break;
987 default:
988 pr_warn("Unexpected monitor type %d\n", m->type);
989 }
990}
991
992static void read_msmon_ctl_flt_vals(struct mon_read *m, u32 *ctl_val,
993 u32 *flt_val)
994{
995 struct mpam_msc *msc = m->ris->vmsc->msc;
996
997 switch (m->type) {
998 case mpam_feat_msmon_csu:
999 *ctl_val = mpam_read_monsel_reg(msc, CFG_CSU_CTL);
1000 *flt_val = mpam_read_monsel_reg(msc, CFG_CSU_FLT);
1001 break;
1002 case mpam_feat_msmon_mbwu_31counter:
1003 case mpam_feat_msmon_mbwu_44counter:
1004 case mpam_feat_msmon_mbwu_63counter:
1005 *ctl_val = mpam_read_monsel_reg(msc, CFG_MBWU_CTL);
1006 *flt_val = mpam_read_monsel_reg(msc, CFG_MBWU_FLT);
1007 break;
1008 default:
1009 pr_warn("Unexpected monitor type %d\n", m->type);
1010 }
1011}
1012
1013/* Remove values set by the hardware to prevent apparent mismatches. */
1014static inline void clean_msmon_ctl_val(u32 *cur_ctl)
1015{
1016 *cur_ctl &= ~MSMON_CFG_x_CTL_OFLOW_STATUS;
1017
1018 if (FIELD_GET(MSMON_CFG_x_CTL_TYPE, *cur_ctl) == MSMON_CFG_MBWU_CTL_TYPE_MBWU)
1019 *cur_ctl &= ~MSMON_CFG_MBWU_CTL_OFLOW_STATUS_L;
1020}
1021
1022static void write_msmon_ctl_flt_vals(struct mon_read *m, u32 ctl_val,
1023 u32 flt_val)
1024{
1025 struct mpam_msc *msc = m->ris->vmsc->msc;
1026
1027 /*
1028 * Write the ctl_val with the enable bit cleared, reset the counter,
1029 * then enable the counter.
1030 */
1031 switch (m->type) {
1032 case mpam_feat_msmon_csu:
1033 mpam_write_monsel_reg(msc, CFG_CSU_FLT, flt_val);
1034 mpam_write_monsel_reg(msc, CFG_CSU_CTL, ctl_val);
1035 mpam_write_monsel_reg(msc, CSU, 0);
1036 mpam_write_monsel_reg(msc, CFG_CSU_CTL, ctl_val | MSMON_CFG_x_CTL_EN);
1037 break;
1038 case mpam_feat_msmon_mbwu_31counter:
1039 case mpam_feat_msmon_mbwu_44counter:
1040 case mpam_feat_msmon_mbwu_63counter:
1041 mpam_write_monsel_reg(msc, CFG_MBWU_FLT, flt_val);
1042 mpam_write_monsel_reg(msc, CFG_MBWU_CTL, ctl_val);
1043 mpam_write_monsel_reg(msc, CFG_MBWU_CTL, ctl_val | MSMON_CFG_x_CTL_EN);
1044 /* Counting monitors require NRDY to be reset by software */
1045 if (m->type == mpam_feat_msmon_mbwu_31counter)
1046 mpam_write_monsel_reg(msc, MBWU, 0);
1047 else
1048 mpam_msc_zero_mbwu_l(m->ris->vmsc->msc);
1049 break;
1050 default:
1051 pr_warn("Unexpected monitor type %d\n", m->type);
1052 }
1053}
1054
1055static u64 mpam_msmon_overflow_val(enum mpam_device_features type)
1056{
1057 /* TODO: implement scaling counters */
1058 switch (type) {
1059 case mpam_feat_msmon_mbwu_63counter:
1060 return BIT_ULL(hweight_long(MSMON___LWD_VALUE));
1061 case mpam_feat_msmon_mbwu_44counter:
1062 return BIT_ULL(hweight_long(MSMON___L_VALUE));
1063 case mpam_feat_msmon_mbwu_31counter:
1064 return BIT_ULL(hweight_long(MSMON___VALUE));
1065 default:
1066 return 0;
1067 }
1068}
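
/*
 * e.g. with the 44-bit MBWU counter (assuming MSMON___L_VALUE covers bits
 * [43:0]), hweight_long() gives 44 and each overflow adds BIT_ULL(44) to the
 * correction applied in __ris_msmon_read() below.
 */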
1069
1070static void __ris_msmon_read(void *arg)
1071{
1072 u64 now;
1073 bool nrdy = false;
1074 bool config_mismatch;
1075 bool overflow = false;
1076 struct mon_read *m = arg;
1077 struct mon_cfg *ctx = m->ctx;
1078 bool reset_on_next_read = false;
1079 struct mpam_msc_ris *ris = m->ris;
1080 struct msmon_mbwu_state *mbwu_state;
1081 struct mpam_props *rprops = &ris->props;
1082 struct mpam_msc *msc = m->ris->vmsc->msc;
1083 u32 mon_sel, ctl_val, flt_val, cur_ctl, cur_flt;
1084
1085 if (!mpam_mon_sel_lock(msc)) {
1086 m->err = -EIO;
1087 return;
1088 }
1089 mon_sel = FIELD_PREP(MSMON_CFG_MON_SEL_MON_SEL, ctx->mon) |
1090 FIELD_PREP(MSMON_CFG_MON_SEL_RIS, ris->ris_idx);
1091 mpam_write_monsel_reg(msc, CFG_MON_SEL, mon_sel);
1092
1093 switch (m->type) {
1094 case mpam_feat_msmon_mbwu_31counter:
1095 case mpam_feat_msmon_mbwu_44counter:
1096 case mpam_feat_msmon_mbwu_63counter:
1097 mbwu_state = &ris->mbwu_state[ctx->mon];
1098 if (mbwu_state) {
1099 reset_on_next_read = mbwu_state->reset_on_next_read;
1100 mbwu_state->reset_on_next_read = false;
1101 }
1102 break;
1103 default:
1104 break;
1105 }
1106
1107 /*
1108 * Read the existing configuration to avoid re-writing the same values.
1109 * This saves waiting for 'nrdy' on subsequent reads.
1110 */
1111 read_msmon_ctl_flt_vals(m, &cur_ctl, &cur_flt);
1112
1113 if (mpam_feat_msmon_mbwu_31counter == m->type)
1114 overflow = cur_ctl & MSMON_CFG_x_CTL_OFLOW_STATUS;
1115 else if (mpam_feat_msmon_mbwu_44counter == m->type ||
1116 mpam_feat_msmon_mbwu_63counter == m->type)
1117 overflow = cur_ctl & MSMON_CFG_MBWU_CTL_OFLOW_STATUS_L;
1118
1119 clean_msmon_ctl_val(&cur_ctl);
1120 gen_msmon_ctl_flt_vals(m, &ctl_val, &flt_val);
1121 config_mismatch = cur_flt != flt_val ||
1122 cur_ctl != (ctl_val | MSMON_CFG_x_CTL_EN);
1123
1124 if (config_mismatch || reset_on_next_read) {
1125 write_msmon_ctl_flt_vals(m, ctl_val, flt_val);
1126 overflow = false;
1127 } else if (overflow) {
1128 mpam_write_monsel_reg(msc, CFG_MBWU_CTL,
1129 cur_ctl &
1130 ~(MSMON_CFG_x_CTL_OFLOW_STATUS |
1131 MSMON_CFG_MBWU_CTL_OFLOW_STATUS_L));
1132 }
1133
1134 switch (m->type) {
1135 case mpam_feat_msmon_csu:
1136 now = mpam_read_monsel_reg(msc, CSU);
1137 if (mpam_has_feature(mpam_feat_msmon_csu_hw_nrdy, rprops))
1138 nrdy = now & MSMON___NRDY;
1139 now = FIELD_GET(MSMON___VALUE, now);
1140 break;
1141 case mpam_feat_msmon_mbwu_31counter:
1142 case mpam_feat_msmon_mbwu_44counter:
1143 case mpam_feat_msmon_mbwu_63counter:
1144 if (m->type != mpam_feat_msmon_mbwu_31counter) {
1145 now = mpam_msc_read_mbwu_l(msc);
1146 if (mpam_has_feature(mpam_feat_msmon_mbwu_hw_nrdy, rprops))
1147 nrdy = now & MSMON___L_NRDY;
1148
1149 if (m->type == mpam_feat_msmon_mbwu_63counter)
1150 now = FIELD_GET(MSMON___LWD_VALUE, now);
1151 else
1152 now = FIELD_GET(MSMON___L_VALUE, now);
1153 } else {
1154 now = mpam_read_monsel_reg(msc, MBWU);
1155 if (mpam_has_feature(mpam_feat_msmon_mbwu_hw_nrdy, rprops))
1156 nrdy = now & MSMON___NRDY;
1157 now = FIELD_GET(MSMON___VALUE, now);
1158 }
1159
1160 if (nrdy)
1161 break;
1162
1163 mbwu_state = &ris->mbwu_state[ctx->mon];
1164
1165 if (overflow)
1166 mbwu_state->correction += mpam_msmon_overflow_val(m->type);
1167
1168 /*
1169 * Include bandwidth consumed before the last hardware reset and
1170 * a counter size increment for each overflow.
1171 */
1172 now += mbwu_state->correction;
1173 break;
1174 default:
1175 m->err = -EINVAL;
1176 }
1177 mpam_mon_sel_unlock(msc);
1178
1179 if (nrdy)
1180 m->err = -EBUSY;
1181
1182 if (m->err)
1183 return;
1184
1185 *m->val += now;
1186}
1187
1188static int _msmon_read(struct mpam_component *comp, struct mon_read *arg)
1189{
1190 int err, any_err = 0;
1191 struct mpam_vmsc *vmsc;
1192
1193 guard(srcu)(&mpam_srcu);
1194 list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
1195 srcu_read_lock_held(&mpam_srcu)) {
1196 struct mpam_msc *msc = vmsc->msc;
1197 struct mpam_msc_ris *ris;
1198
1199 list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
1200 srcu_read_lock_held(&mpam_srcu)) {
1201 arg->ris = ris;
1202
1203 err = smp_call_function_any(&msc->accessibility,
1204 __ris_msmon_read, arg,
1205 true);
1206 if (!err && arg->err)
1207 err = arg->err;
1208
1209 /*
1210 * Save one error to be returned to the caller, but
1211 * keep reading counters so that they get reprogrammed. On
1212 * platforms with NRDY this lets us wait once.
1213 */
1214 if (err)
1215 any_err = err;
1216 }
1217 }
1218
1219 return any_err;
1220}
1221
1222static enum mpam_device_features mpam_msmon_choose_counter(struct mpam_class *class)
1223{
1224 struct mpam_props *cprops = &class->props;
1225
1226 if (mpam_has_feature(mpam_feat_msmon_mbwu_63counter, cprops))
1227 return mpam_feat_msmon_mbwu_63counter;
1228 if (mpam_has_feature(mpam_feat_msmon_mbwu_44counter, cprops))
1229 return mpam_feat_msmon_mbwu_44counter;
1230
1231 return mpam_feat_msmon_mbwu_31counter;
1232}
1233
1234int mpam_msmon_read(struct mpam_component *comp, struct mon_cfg *ctx,
1235 enum mpam_device_features type, u64 *val)
1236{
1237 int err;
1238 struct mon_read arg;
1239 u64 wait_jiffies = 0;
1240 struct mpam_class *class = comp->class;
1241 struct mpam_props *cprops = &class->props;
1242
1243 might_sleep();
1244
1245 if (!mpam_is_enabled())
1246 return -EIO;
1247
1248 if (!mpam_has_feature(type, cprops))
1249 return -EOPNOTSUPP;
1250
1251 if (type == mpam_feat_msmon_mbwu)
1252 type = mpam_msmon_choose_counter(class);
1253
1254 arg = (struct mon_read) {
1255 .ctx = ctx,
1256 .type = type,
1257 .val = val,
1258 };
1259 *val = 0;
1260
1261 err = _msmon_read(comp, &arg);
1262 if (err == -EBUSY && class->nrdy_usec)
1263 wait_jiffies = usecs_to_jiffies(class->nrdy_usec);
1264
1265 while (wait_jiffies)
1266 wait_jiffies = schedule_timeout_uninterruptible(wait_jiffies);
1267
1268 if (err == -EBUSY) {
1269 arg = (struct mon_read) {
1270 .ctx = ctx,
1271 .type = type,
1272 .val = val,
1273 };
1274 *val = 0;
1275
1276 err = _msmon_read(comp, &arg);
1277 }
1278
1279 return err;
1280}
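
/*
 * Example call (a sketch; monitor allocation and the partid/pmg mapping are
 * the caller's job, e.g. resctrl glue code). mon_idx, partid and pmg are
 * placeholders:
 *
 *	struct mon_cfg cfg = {
 *		.mon = mon_idx,
 *		.partid = partid,
 *		.match_pmg = true,
 *		.pmg = pmg,
 *	};
 *	u64 bytes;
 *
 *	err = mpam_msmon_read(comp, &cfg, mpam_feat_msmon_mbwu, &bytes);
 *
 * -EBUSY means NRDY never cleared within the firmware-described
 * 'arm,not-ready-us' period.
 */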
1281
1282void mpam_msmon_reset_mbwu(struct mpam_component *comp, struct mon_cfg *ctx)
1283{
1284 struct mpam_msc *msc;
1285 struct mpam_vmsc *vmsc;
1286 struct mpam_msc_ris *ris;
1287
1288 if (!mpam_is_enabled())
1289 return;
1290
1291 guard(srcu)(&mpam_srcu);
1292 list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
1293 srcu_read_lock_held(&mpam_srcu)) {
1294 if (!mpam_has_feature(mpam_feat_msmon_mbwu, &vmsc->props))
1295 continue;
1296
1297 msc = vmsc->msc;
1298 list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
1299 srcu_read_lock_held(&mpam_srcu)) {
1300 if (!mpam_has_feature(mpam_feat_msmon_mbwu, &ris->props))
1301 continue;
1302
1303 if (WARN_ON_ONCE(!mpam_mon_sel_lock(msc)))
1304 continue;
1305
1306 ris->mbwu_state[ctx->mon].correction = 0;
1307 ris->mbwu_state[ctx->mon].reset_on_next_read = true;
1308 mpam_mon_sel_unlock(msc);
1309 }
1310 }
1311}
1312
1313static void mpam_reset_msc_bitmap(struct mpam_msc *msc, u16 reg, u16 wd)
1314{
1315 u32 num_words, msb;
1316 u32 bm = ~0;
1317 int i;
1318
1319 lockdep_assert_held(&msc->part_sel_lock);
1320
1321 if (wd == 0)
1322 return;
1323
1324 /*
1325 * Write all ~0 to all but the last 32bit-word, which may
1326 * have fewer bits...
1327 */
1328 num_words = DIV_ROUND_UP(wd, 32);
1329 for (i = 0; i < num_words - 1; i++, reg += sizeof(bm))
1330 __mpam_write_reg(msc, reg, bm);
1331
1332 /*
1333 * ....and then the last (maybe) partial 32bit word. When wd is a
1334 * multiple of 32, msb should be 31 to write a full 32bit word.
1335 */
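	/*
	 * e.g. wd = 40: one full word of ~0 was written above, then
	 * msb = (40 - 1) % 32 = 7 and the final word is GENMASK(7, 0).
	 * wd = 32: the loop writes nothing and the single word is GENMASK(31, 0).
	 */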
1336 msb = (wd - 1) % 32;
1337 bm = GENMASK(msb, 0);
1338 __mpam_write_reg(msc, reg, bm);
1339}
1340
1341/* Called via smp_call_on_cpu(). Call while holding an SRCU reference */
1342static void mpam_reprogram_ris_partid(struct mpam_msc_ris *ris, u16 partid,
1343 struct mpam_config *cfg)
1344{
1345 u32 pri_val = 0;
1346 u16 cmax = MPAMCFG_CMAX_CMAX;
1347 struct mpam_msc *msc = ris->vmsc->msc;
1348 struct mpam_props *rprops = &ris->props;
1349 u16 dspri = GENMASK(rprops->dspri_wd, 0);
1350 u16 intpri = GENMASK(rprops->intpri_wd, 0);
1351
1352 mutex_lock(&msc->part_sel_lock);
1353 __mpam_part_sel(ris->ris_idx, partid, msc);
1354
1355 if (mpam_has_feature(mpam_feat_partid_nrw, rprops)) {
1356 /* Update the intpartid mapping */
1357 mpam_write_partsel_reg(msc, INTPARTID,
1358 MPAMCFG_INTPARTID_INTERNAL | partid);
1359
1360 /*
1361 * Then switch to the 'internal' partid to update the
1362 * configuration.
1363 */
1364 __mpam_intpart_sel(ris->ris_idx, partid, msc);
1365 }
1366
1367 if (mpam_has_feature(mpam_feat_cpor_part, rprops) &&
1368 mpam_has_feature(mpam_feat_cpor_part, cfg)) {
1369 if (cfg->reset_cpbm)
1370 mpam_reset_msc_bitmap(msc, MPAMCFG_CPBM, rprops->cpbm_wd);
1371 else
1372 mpam_write_partsel_reg(msc, CPBM, cfg->cpbm);
1373 }
1374
1375 if (mpam_has_feature(mpam_feat_mbw_part, rprops) &&
1376 mpam_has_feature(mpam_feat_mbw_part, cfg)) {
1377 if (cfg->reset_mbw_pbm)
1378 mpam_reset_msc_bitmap(msc, MPAMCFG_MBW_PBM, rprops->mbw_pbm_bits);
1379 else
1380 mpam_write_partsel_reg(msc, MBW_PBM, cfg->mbw_pbm);
1381 }
1382
1383 if (mpam_has_feature(mpam_feat_mbw_min, rprops) &&
1384 mpam_has_feature(mpam_feat_mbw_min, cfg))
1385 mpam_write_partsel_reg(msc, MBW_MIN, 0);
1386
1387 if (mpam_has_feature(mpam_feat_mbw_max, rprops) &&
1388 mpam_has_feature(mpam_feat_mbw_max, cfg)) {
1389 if (cfg->reset_mbw_max)
1390 mpam_write_partsel_reg(msc, MBW_MAX, MPAMCFG_MBW_MAX_MAX);
1391 else
1392 mpam_write_partsel_reg(msc, MBW_MAX, cfg->mbw_max);
1393 }
1394
1395 if (mpam_has_feature(mpam_feat_mbw_prop, rprops) &&
1396 mpam_has_feature(mpam_feat_mbw_prop, cfg))
1397 mpam_write_partsel_reg(msc, MBW_PROP, 0);
1398
1399 if (mpam_has_feature(mpam_feat_cmax_cmax, rprops))
1400 mpam_write_partsel_reg(msc, CMAX, cmax);
1401
1402 if (mpam_has_feature(mpam_feat_cmax_cmin, rprops))
1403 mpam_write_partsel_reg(msc, CMIN, 0);
1404
1405 if (mpam_has_feature(mpam_feat_cmax_cassoc, rprops))
1406 mpam_write_partsel_reg(msc, CASSOC, MPAMCFG_CASSOC_CASSOC);
1407
1408 if (mpam_has_feature(mpam_feat_intpri_part, rprops) ||
1409 mpam_has_feature(mpam_feat_dspri_part, rprops)) {
1410 /* aces high? */
1411 if (!mpam_has_feature(mpam_feat_intpri_part_0_low, rprops))
1412 intpri = 0;
1413 if (!mpam_has_feature(mpam_feat_dspri_part_0_low, rprops))
1414 dspri = 0;
1415
1416 if (mpam_has_feature(mpam_feat_intpri_part, rprops))
1417 pri_val |= FIELD_PREP(MPAMCFG_PRI_INTPRI, intpri);
1418 if (mpam_has_feature(mpam_feat_dspri_part, rprops))
1419 pri_val |= FIELD_PREP(MPAMCFG_PRI_DSPRI, dspri);
1420
1421 mpam_write_partsel_reg(msc, PRI, pri_val);
1422 }
1423
1424 mutex_unlock(&msc->part_sel_lock);
1425}
1426
1427/* Call with msc cfg_lock held */
1428static int mpam_restore_mbwu_state(void *_ris)
1429{
1430 int i;
1431 struct mon_read mbwu_arg;
1432 struct mpam_msc_ris *ris = _ris;
1433 struct mpam_class *class = ris->vmsc->comp->class;
1434
1435 for (i = 0; i < ris->props.num_mbwu_mon; i++) {
1436 if (ris->mbwu_state[i].enabled) {
1437 mbwu_arg.ris = ris;
1438 mbwu_arg.ctx = &ris->mbwu_state[i].cfg;
1439 mbwu_arg.type = mpam_msmon_choose_counter(class);
1440
1441 __ris_msmon_read(&mbwu_arg);
1442 }
1443 }
1444
1445 return 0;
1446}
1447
1448/* Call with MSC cfg_lock held */
1449static int mpam_save_mbwu_state(void *arg)
1450{
1451 int i;
1452 u64 val;
1453 struct mon_cfg *cfg;
1454 u32 cur_flt, cur_ctl, mon_sel;
1455 struct mpam_msc_ris *ris = arg;
1456 struct msmon_mbwu_state *mbwu_state;
1457 struct mpam_msc *msc = ris->vmsc->msc;
1458
1459 for (i = 0; i < ris->props.num_mbwu_mon; i++) {
1460 mbwu_state = &ris->mbwu_state[i];
1461 cfg = &mbwu_state->cfg;
1462
1463 if (WARN_ON_ONCE(!mpam_mon_sel_lock(msc)))
1464 return -EIO;
1465
1466 mon_sel = FIELD_PREP(MSMON_CFG_MON_SEL_MON_SEL, i) |
1467 FIELD_PREP(MSMON_CFG_MON_SEL_RIS, ris->ris_idx);
1468 mpam_write_monsel_reg(msc, CFG_MON_SEL, mon_sel);
1469
1470 cur_flt = mpam_read_monsel_reg(msc, CFG_MBWU_FLT);
1471 cur_ctl = mpam_read_monsel_reg(msc, CFG_MBWU_CTL);
1472 mpam_write_monsel_reg(msc, CFG_MBWU_CTL, 0);
1473
1474 if (mpam_ris_has_mbwu_long_counter(ris)) {
1475 val = mpam_msc_read_mbwu_l(msc);
1476 mpam_msc_zero_mbwu_l(msc);
1477 } else {
1478 val = mpam_read_monsel_reg(msc, MBWU);
1479 mpam_write_monsel_reg(msc, MBWU, 0);
1480 }
1481
1482 cfg->mon = i;
1483 cfg->pmg = FIELD_GET(MSMON_CFG_x_FLT_PMG, cur_flt);
1484 cfg->match_pmg = FIELD_GET(MSMON_CFG_x_CTL_MATCH_PMG, cur_ctl);
1485 cfg->partid = FIELD_GET(MSMON_CFG_x_FLT_PARTID, cur_flt);
1486 mbwu_state->correction += val;
1487 mbwu_state->enabled = FIELD_GET(MSMON_CFG_x_CTL_EN, cur_ctl);
1488 mpam_mon_sel_unlock(msc);
1489 }
1490
1491 return 0;
1492}
1493
1494static void mpam_init_reset_cfg(struct mpam_config *reset_cfg)
1495{
1496 *reset_cfg = (struct mpam_config) {
1497 .reset_cpbm = true,
1498 .reset_mbw_pbm = true,
1499 .reset_mbw_max = true,
1500 };
1501 bitmap_fill(reset_cfg->features, MPAM_FEATURE_LAST);
1502}
1503
1504/*
1505 * Called via smp_call_on_cpu() to prevent migration, while still being
1506 * pre-emptible. Caller must hold mpam_srcu.
1507 */
1508static int mpam_reset_ris(void *arg)
1509{
1510 u16 partid, partid_max;
1511 struct mpam_config reset_cfg;
1512 struct mpam_msc_ris *ris = arg;
1513
1514 if (ris->in_reset_state)
1515 return 0;
1516
1517 mpam_init_reset_cfg(&reset_cfg);
1518
1519 spin_lock(&partid_max_lock);
1520 partid_max = mpam_partid_max;
1521 spin_unlock(&partid_max_lock);
1522 for (partid = 0; partid <= partid_max; partid++)
1523 mpam_reprogram_ris_partid(ris, partid, &reset_cfg);
1524
1525 return 0;
1526}
1527
1528/*
1529 * Get the preferred CPU for this MSC. If it is accessible from this CPU,
1530 * this CPU is preferred. This can be preempted/migrated; that will only result
1531 * in more work.
1532 */
1533static int mpam_get_msc_preferred_cpu(struct mpam_msc *msc)
1534{
1535 int cpu = raw_smp_processor_id();
1536
1537 if (cpumask_test_cpu(cpu, &msc->accessibility))
1538 return cpu;
1539
1540 return cpumask_first_and(&msc->accessibility, cpu_online_mask);
1541}
1542
1543static int mpam_touch_msc(struct mpam_msc *msc, int (*fn)(void *a), void *arg)
1544{
1545 lockdep_assert_irqs_enabled();
1546 lockdep_assert_cpus_held();
1547 WARN_ON_ONCE(!srcu_read_lock_held((&mpam_srcu)));
1548
1549 return smp_call_on_cpu(mpam_get_msc_preferred_cpu(msc), fn, arg, true);
1550}
1551
1552struct mpam_write_config_arg {
1553 struct mpam_msc_ris *ris;
1554 struct mpam_component *comp;
1555 u16 partid;
1556};
1557
1558static int __write_config(void *arg)
1559{
1560 struct mpam_write_config_arg *c = arg;
1561
1562 mpam_reprogram_ris_partid(c->ris, c->partid, &c->comp->cfg[c->partid]);
1563
1564 return 0;
1565}
1566
1567static void mpam_reprogram_msc(struct mpam_msc *msc)
1568{
1569 u16 partid;
1570 bool reset;
1571 struct mpam_config *cfg;
1572 struct mpam_msc_ris *ris;
1573 struct mpam_write_config_arg arg;
1574
1575 /*
1576 * No lock for mpam_partid_max as partid_max_published has been
1577 * set by mpam_enabled(), so the values can no longer change.
1578 */
1579 mpam_assert_partid_sizes_fixed();
1580
1581 mutex_lock(&msc->cfg_lock);
1582 list_for_each_entry_srcu(ris, &msc->ris, msc_list,
1583 srcu_read_lock_held(&mpam_srcu)) {
1584 if (!mpam_is_enabled() && !ris->in_reset_state) {
1585 mpam_touch_msc(msc, &mpam_reset_ris, ris);
1586 ris->in_reset_state = true;
1587 continue;
1588 }
1589
1590 arg.comp = ris->vmsc->comp;
1591 arg.ris = ris;
1592 reset = true;
1593 for (partid = 0; partid <= mpam_partid_max; partid++) {
1594 cfg = &ris->vmsc->comp->cfg[partid];
1595 if (!bitmap_empty(cfg->features, MPAM_FEATURE_LAST))
1596 reset = false;
1597
1598 arg.partid = partid;
1599 mpam_touch_msc(msc, __write_config, &arg);
1600 }
1601 ris->in_reset_state = reset;
1602
1603 if (mpam_has_feature(mpam_feat_msmon_mbwu, &ris->props))
1604 mpam_touch_msc(msc, &mpam_restore_mbwu_state, ris);
1605 }
1606 mutex_unlock(&msc->cfg_lock);
1607}
1608
1609static void _enable_percpu_irq(void *_irq)
1610{
1611 int *irq = _irq;
1612
1613 enable_percpu_irq(*irq, IRQ_TYPE_NONE);
1614}
1615
1616static int mpam_cpu_online(unsigned int cpu)
1617{
1618 struct mpam_msc *msc;
1619
1620 guard(srcu)(&mpam_srcu);
1621 list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
1622 srcu_read_lock_held(&mpam_srcu)) {
1623 if (!cpumask_test_cpu(cpu, &msc->accessibility))
1624 continue;
1625
1626 if (msc->reenable_error_ppi)
1627 _enable_percpu_irq(&msc->reenable_error_ppi);
1628
1629 if (atomic_fetch_inc(&msc->online_refs) == 0)
1630 mpam_reprogram_msc(msc);
1631 }
1632
1633 return 0;
1634}
1635
1636/* Before mpam is enabled, try to probe new MSC */
1637static int mpam_discovery_cpu_online(unsigned int cpu)
1638{
1639 int err = 0;
1640 struct mpam_msc *msc;
1641 bool new_device_probed = false;
1642
1643 if (mpam_is_enabled())
1644 return 0;
1645
1646 guard(srcu)(&mpam_srcu);
1647 list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
1648 srcu_read_lock_held(&mpam_srcu)) {
1649 if (!cpumask_test_cpu(cpu, &msc->accessibility))
1650 continue;
1651
1652 mutex_lock(&msc->probe_lock);
1653 if (!msc->probed)
1654 err = mpam_msc_hw_probe(msc);
1655 mutex_unlock(&msc->probe_lock);
1656
1657 if (err)
1658 break;
1659 new_device_probed = true;
1660 }
1661
1662 if (new_device_probed && !err)
1663 schedule_work(&mpam_enable_work);
1664 if (err) {
1665 mpam_disable_reason = "error during probing";
1666 schedule_work(&mpam_broken_work);
1667 }
1668
1669 return err;
1670}
1671
1672static int mpam_cpu_offline(unsigned int cpu)
1673{
1674 struct mpam_msc *msc;
1675
1676 guard(srcu)(&mpam_srcu);
1677 list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
1678 srcu_read_lock_held(&mpam_srcu)) {
1679 if (!cpumask_test_cpu(cpu, &msc->accessibility))
1680 continue;
1681
1682 if (msc->reenable_error_ppi)
1683 disable_percpu_irq(msc->reenable_error_ppi);
1684
1685 if (atomic_dec_and_test(&msc->online_refs)) {
1686 struct mpam_msc_ris *ris;
1687
1688 mutex_lock(&msc->cfg_lock);
1689 list_for_each_entry_srcu(ris, &msc->ris, msc_list,
1690 srcu_read_lock_held(&mpam_srcu)) {
1691 mpam_touch_msc(msc, &mpam_reset_ris, ris);
1692
1693 /*
1694 * The reset state for non-zero partid may be
1695 * lost while the CPUs are offline.
1696 */
1697 ris->in_reset_state = false;
1698
1699 if (mpam_is_enabled())
1700 mpam_touch_msc(msc, &mpam_save_mbwu_state, ris);
1701 }
1702 mutex_unlock(&msc->cfg_lock);
1703 }
1704 }
1705
1706 return 0;
1707}
1708
1709static void mpam_register_cpuhp_callbacks(int (*online)(unsigned int online),
1710 int (*offline)(unsigned int offline),
1711 char *name)
1712{
1713 mutex_lock(&mpam_cpuhp_state_lock);
1714 if (mpam_cpuhp_state) {
1715 cpuhp_remove_state(mpam_cpuhp_state);
1716 mpam_cpuhp_state = 0;
1717 }
1718
1719 mpam_cpuhp_state = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, name, online,
1720 offline);
1721 if (mpam_cpuhp_state <= 0) {
1722 pr_err("Failed to register cpuhp callbacks");
1723 mpam_cpuhp_state = 0;
1724 }
1725 mutex_unlock(&mpam_cpuhp_state_lock);
1726}
1727
1728static int __setup_ppi(struct mpam_msc *msc)
1729{
1730 int cpu;
1731
1732 msc->error_dev_id = alloc_percpu(struct mpam_msc *);
1733 if (!msc->error_dev_id)
1734 return -ENOMEM;
1735
1736 for_each_cpu(cpu, &msc->accessibility)
1737 *per_cpu_ptr(msc->error_dev_id, cpu) = msc;
1738
1739 return 0;
1740}
1741
1742static int mpam_msc_setup_error_irq(struct mpam_msc *msc)
1743{
1744 int irq;
1745
1746 irq = platform_get_irq_byname_optional(msc->pdev, "error");
1747 if (irq <= 0)
1748 return 0;
1749
1750 /* Allocate and initialise the percpu device pointer for PPI */
1751 if (irq_is_percpu(irq))
1752 return __setup_ppi(msc);
1753
1754 /* sanity check: shared interrupts can be routed anywhere? */
1755 if (!cpumask_equal(&msc->accessibility, cpu_possible_mask)) {
1756 pr_err_once("msc:%u is a private resource with a shared error interrupt",
1757 msc->id);
1758 return -EINVAL;
1759 }
1760
1761 return 0;
1762}
1763
1764/*
1765 * An MSC can control traffic from a set of CPUs, but may only be accessible
1766 * from a (hopefully wider) set of CPUs. The common reason for this is power
1767 * management. If all the CPUs in a cluster are in PSCI:CPU_SUSPEND, the
1768 * corresponding cache may also be powered off. By making accesses from
1769 * one of those CPUs, we ensure we don't access a cache that's powered off.
1770 */
1771static void update_msc_accessibility(struct mpam_msc *msc)
1772{
1773 u32 affinity_id;
1774 int err;
1775
1776 err = device_property_read_u32(&msc->pdev->dev, "cpu_affinity",
1777 &affinity_id);
1778 if (err)
1779 cpumask_copy(&msc->accessibility, cpu_possible_mask);
1780 else
1781 acpi_pptt_get_cpus_from_container(affinity_id, &msc->accessibility);
1782}
1783
1784/*
1785 * There are two ways of reaching a struct mpam_msc_ris. Via the
1786 * class->component->vmsc->ris, or via the msc.
1787 * When destroying the msc, the other side needs unlinking and cleaning up too.
1788 */
1789static void mpam_msc_destroy(struct mpam_msc *msc)
1790{
1791 struct platform_device *pdev = msc->pdev;
1792 struct mpam_msc_ris *ris, *tmp;
1793
1794 lockdep_assert_held(&mpam_list_lock);
1795
1796 list_for_each_entry_safe(ris, tmp, &msc->ris, msc_list)
1797 mpam_ris_destroy(ris);
1798
1799 list_del_rcu(&msc->all_msc_list);
1800 platform_set_drvdata(pdev, NULL);
1801
1802 add_to_garbage(msc);
1803}
1804
1805static void mpam_msc_drv_remove(struct platform_device *pdev)
1806{
1807 struct mpam_msc *msc = platform_get_drvdata(pdev);
1808
1809 mutex_lock(&mpam_list_lock);
1810 mpam_msc_destroy(msc);
1811 mutex_unlock(&mpam_list_lock);
1812
1813 mpam_free_garbage();
1814}
1815
1816static struct mpam_msc *do_mpam_msc_drv_probe(struct platform_device *pdev)
1817{
1818 int err;
1819 u32 tmp;
1820 struct mpam_msc *msc;
1821 struct resource *msc_res;
1822 struct device *dev = &pdev->dev;
1823
1824 lockdep_assert_held(&mpam_list_lock);
1825
1826 msc = devm_kzalloc(&pdev->dev, sizeof(*msc), GFP_KERNEL);
1827 if (!msc)
1828 return ERR_PTR(-ENOMEM);
1829 init_garbage(&msc->garbage);
1830 msc->garbage.pdev = pdev;
1831
1832 err = devm_mutex_init(dev, &msc->probe_lock);
1833 if (err)
1834 return ERR_PTR(err);
1835
1836 err = devm_mutex_init(dev, &msc->part_sel_lock);
1837 if (err)
1838 return ERR_PTR(err);
1839
1840 err = devm_mutex_init(dev, &msc->error_irq_lock);
1841 if (err)
1842 return ERR_PTR(err);
1843
1844 err = devm_mutex_init(dev, &msc->cfg_lock);
1845 if (err)
1846 return ERR_PTR(err);
1847
1848 mpam_mon_sel_lock_init(msc);
1849 msc->id = pdev->id;
1850 msc->pdev = pdev;
1851 INIT_LIST_HEAD_RCU(&msc->all_msc_list);
1852 INIT_LIST_HEAD_RCU(&msc->ris);
1853
1854 update_msc_accessibility(msc);
1855 if (cpumask_empty(&msc->accessibility)) {
1856 dev_err_once(dev, "MSC is not accessible from any CPU!");
1857 return ERR_PTR(-EINVAL);
1858 }
1859
1860 err = mpam_msc_setup_error_irq(msc);
1861 if (err)
1862 return ERR_PTR(err);
1863
1864 if (device_property_read_u32(&pdev->dev, "pcc-channel", &tmp))
1865 msc->iface = MPAM_IFACE_MMIO;
1866 else
1867 msc->iface = MPAM_IFACE_PCC;
1868
1869 if (msc->iface == MPAM_IFACE_MMIO) {
1870 void __iomem *io;
1871
1872 io = devm_platform_get_and_ioremap_resource(pdev, 0,
1873 &msc_res);
1874 if (IS_ERR(io)) {
1875 dev_err_once(dev, "Failed to map MSC base address\n");
1876 return ERR_CAST(io);
1877 }
1878 msc->mapped_hwpage_sz = resource_size(msc_res);
1879 msc->mapped_hwpage = io;
1880 } else {
1881 return ERR_PTR(-EINVAL);
1882 }
1883
1884 list_add_rcu(&msc->all_msc_list, &mpam_all_msc);
1885 platform_set_drvdata(pdev, msc);
1886
1887 return msc;
1888}
1889
1890static int fw_num_msc;
1891
1892static int mpam_msc_drv_probe(struct platform_device *pdev)
1893{
1894 int err;
1895 struct mpam_msc *msc = NULL;
1896 void *plat_data = pdev->dev.platform_data;
1897
1898 mutex_lock(&mpam_list_lock);
1899 msc = do_mpam_msc_drv_probe(pdev);
1900 mutex_unlock(&mpam_list_lock);
1901
1902 if (IS_ERR(msc))
1903 return PTR_ERR(msc);
1904
1905 /* Create RIS entries described by firmware */
1906 err = acpi_mpam_parse_resources(msc, plat_data);
1907 if (err) {
1908 mpam_msc_drv_remove(pdev);
1909 return err;
1910 }
1911
1912 if (atomic_add_return(1, &mpam_num_msc) == fw_num_msc)
1913 mpam_register_cpuhp_callbacks(mpam_discovery_cpu_online, NULL,
1914 "mpam:drv_probe");
1915
1916 return 0;
1917}
1918
1919static struct platform_driver mpam_msc_driver = {
1920 .driver = {
1921 .name = "mpam_msc",
1922 },
1923 .probe = mpam_msc_drv_probe,
1924 .remove = mpam_msc_drv_remove,
1925};
1926
1927/* Any of these features means the BWA_WD field is valid. */
1928static bool mpam_has_bwa_wd_feature(struct mpam_props *props)
1929{
1930 if (mpam_has_feature(mpam_feat_mbw_min, props))
1931 return true;
1932 if (mpam_has_feature(mpam_feat_mbw_max, props))
1933 return true;
1934 if (mpam_has_feature(mpam_feat_mbw_prop, props))
1935 return true;
1936 return false;
1937}
1938
1939/* Any of these features means the CMAX_WD field is valid. */
1940static bool mpam_has_cmax_wd_feature(struct mpam_props *props)
1941{
1942 if (mpam_has_feature(mpam_feat_cmax_cmax, props))
1943 return true;
1944 if (mpam_has_feature(mpam_feat_cmax_cmin, props))
1945 return true;
1946 return false;
1947}
1948
1949#define MISMATCHED_HELPER(parent, child, helper, field, alias) \
1950 (helper(parent) && \
1951 ((helper(child) && (parent)->field != (child)->field) || \
1952 (!helper(child) && !(alias))))
1953
1954#define MISMATCHED_FEAT(parent, child, feat, field, alias) \
1955 (mpam_has_feature((feat), (parent)) && \
1956 ((mpam_has_feature((feat), (child)) && (parent)->field != (child)->field) || \
1957 (!mpam_has_feature((feat), (child)) && !(alias))))
1958
1959#define CAN_MERGE_FEAT(parent, child, feat, alias) \
1960 ((alias) && !mpam_has_feature((feat), (parent)) && \
1961 mpam_has_feature((feat), (child)))
1962
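/*
 * An illustrative expansion (not generated code): for the cache portion
 * bitmap, MISMATCHED_FEAT(parent, child, mpam_feat_cpor_part, cpbm_wd, alias)
 * evaluates roughly as:
 *
 *	mpam_has_feature(mpam_feat_cpor_part, parent) &&
 *	((mpam_has_feature(mpam_feat_cpor_part, child) &&
 *	  parent->cpbm_wd != child->cpbm_wd) ||
 *	 (!mpam_has_feature(mpam_feat_cpor_part, child) && !alias))
 *
 * i.e. the parent claims the feature, and the child either disagrees on the
 * width, or (for non-aliasing controls) lacks the feature entirely.
 */
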
1963/*
1964 * Combine two sets of properties.
1965 * If this is for controls that alias the same resource, it is safe to just
1966 * copy the values over. If two aliasing controls implement the same scheme,
1967 * a safe value must be picked.
1968 * Non-aliasing controls regulate different resources, so the resulting
1969 * value must be safe for both. When merging values in the tree, all the
1970 * aliasing resources must be handled first.
1971 * On mismatch, parent is modified.
1972 */
1973static void __props_mismatch(struct mpam_props *parent,
1974 struct mpam_props *child, bool alias)
1975{
1976 if (CAN_MERGE_FEAT(parent, child, mpam_feat_cpor_part, alias)) {
1977 parent->cpbm_wd = child->cpbm_wd;
1978 } else if (MISMATCHED_FEAT(parent, child, mpam_feat_cpor_part,
1979 cpbm_wd, alias)) {
1980 pr_debug("cleared cpor_part\n");
1981 mpam_clear_feature(mpam_feat_cpor_part, parent);
1982 parent->cpbm_wd = 0;
1983 }
1984
1985 if (CAN_MERGE_FEAT(parent, child, mpam_feat_mbw_part, alias)) {
1986 parent->mbw_pbm_bits = child->mbw_pbm_bits;
1987 } else if (MISMATCHED_FEAT(parent, child, mpam_feat_mbw_part,
1988 mbw_pbm_bits, alias)) {
1989 pr_debug("cleared mbw_part\n");
1990 mpam_clear_feature(mpam_feat_mbw_part, parent);
1991 parent->mbw_pbm_bits = 0;
1992 }
1993
1994 /* bwa_wd is a count of bits, fewer bits means less precision */
1995 if (alias && !mpam_has_bwa_wd_feature(parent) &&
1996 mpam_has_bwa_wd_feature(child)) {
1997 parent->bwa_wd = child->bwa_wd;
1998 } else if (MISMATCHED_HELPER(parent, child, mpam_has_bwa_wd_feature,
1999 bwa_wd, alias)) {
2000 pr_debug("took the min bwa_wd\n");
2001 parent->bwa_wd = min(parent->bwa_wd, child->bwa_wd);
2002 }
2003
2004 if (alias && !mpam_has_cmax_wd_feature(parent) && mpam_has_cmax_wd_feature(child)) {
2005 parent->cmax_wd = child->cmax_wd;
2006 } else if (MISMATCHED_HELPER(parent, child, mpam_has_cmax_wd_feature,
2007 cmax_wd, alias)) {
2008 pr_debug("took the min cmax_wd\n");
2009 parent->cmax_wd = min(parent->cmax_wd, child->cmax_wd);
2010 }
2011
2012 if (CAN_MERGE_FEAT(parent, child, mpam_feat_cmax_cassoc, alias)) {
2013 parent->cassoc_wd = child->cassoc_wd;
2014 } else if (MISMATCHED_FEAT(parent, child, mpam_feat_cmax_cassoc,
2015 cassoc_wd, alias)) {
2016 pr_debug("cleared cassoc_wd\n");
2017 mpam_clear_feature(mpam_feat_cmax_cassoc, parent);
2018 parent->cassoc_wd = 0;
2019 }
2020
2021 /* For num properties, take the minimum */
2022 if (CAN_MERGE_FEAT(parent, child, mpam_feat_msmon_csu, alias)) {
2023 parent->num_csu_mon = child->num_csu_mon;
2024 } else if (MISMATCHED_FEAT(parent, child, mpam_feat_msmon_csu,
2025 num_csu_mon, alias)) {
2026 pr_debug("took the min num_csu_mon\n");
2027 parent->num_csu_mon = min(parent->num_csu_mon,
2028 child->num_csu_mon);
2029 }
2030
2031 if (CAN_MERGE_FEAT(parent, child, mpam_feat_msmon_mbwu, alias)) {
2032 parent->num_mbwu_mon = child->num_mbwu_mon;
2033 } else if (MISMATCHED_FEAT(parent, child, mpam_feat_msmon_mbwu,
2034 num_mbwu_mon, alias)) {
2035 pr_debug("took the min num_mbwu_mon\n");
2036 parent->num_mbwu_mon = min(parent->num_mbwu_mon,
2037 child->num_mbwu_mon);
2038 }
2039
2040 if (CAN_MERGE_FEAT(parent, child, mpam_feat_intpri_part, alias)) {
2041 parent->intpri_wd = child->intpri_wd;
2042 } else if (MISMATCHED_FEAT(parent, child, mpam_feat_intpri_part,
2043 intpri_wd, alias)) {
2044 pr_debug("took the min intpri_wd\n");
2045 parent->intpri_wd = min(parent->intpri_wd, child->intpri_wd);
2046 }
2047
2048 if (CAN_MERGE_FEAT(parent, child, mpam_feat_dspri_part, alias)) {
2049 parent->dspri_wd = child->dspri_wd;
2050 } else if (MISMATCHED_FEAT(parent, child, mpam_feat_dspri_part,
2051 dspri_wd, alias)) {
2052 pr_debug("took the min dspri_wd\n");
2053 parent->dspri_wd = min(parent->dspri_wd, child->dspri_wd);
2054 }
2055
2056 /* TODO: alias support for these two */
2057 /* {int,ds}pri may not have differing 0-low behaviour */
2058 if (mpam_has_feature(mpam_feat_intpri_part, parent) &&
2059 (!mpam_has_feature(mpam_feat_intpri_part, child) ||
2060 mpam_has_feature(mpam_feat_intpri_part_0_low, parent) !=
2061 mpam_has_feature(mpam_feat_intpri_part_0_low, child))) {
2062 pr_debug("cleared intpri_part\n");
2063 mpam_clear_feature(mpam_feat_intpri_part, parent);
2064 mpam_clear_feature(mpam_feat_intpri_part_0_low, parent);
2065 }
2066 if (mpam_has_feature(mpam_feat_dspri_part, parent) &&
2067 (!mpam_has_feature(mpam_feat_dspri_part, child) ||
2068 mpam_has_feature(mpam_feat_dspri_part_0_low, parent) !=
2069 mpam_has_feature(mpam_feat_dspri_part_0_low, child))) {
2070 pr_debug("cleared dspri_part\n");
2071 mpam_clear_feature(mpam_feat_dspri_part, parent);
2072 mpam_clear_feature(mpam_feat_dspri_part_0_low, parent);
2073 }
2074
2075 if (alias) {
2076 /* Merge features for aliased resources */
2077 bitmap_or(parent->features, parent->features, child->features, MPAM_FEATURE_LAST);
2078 } else {
2079 /* Clear missing features for non aliasing */
2080 bitmap_and(parent->features, parent->features, child->features, MPAM_FEATURE_LAST);
2081 }
2082}
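
/*
 * Worked example with hypothetical values: when merging aliasing RIS into a
 * vmsc, a RIS that adds cpor_part with cpbm_wd = 16 simply has that value
 * copied into the vmsc. When merging non-aliasing vmsc into a class, a
 * num_csu_mon of 8 on one vmsc and 16 on another becomes 8, and a bwa_wd of
 * 6 against 8 becomes 6: fewer bits only means less precision, so the
 * minimum is safe for both.
 */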
2083
2084/*
2085 * If a vmsc doesn't match class feature/configuration, do the right thing(tm).
2086 * For 'num' properties we can just take the minimum.
2087 * For properties where the mismatched unused bits would make a difference, we
2088 * nobble the class feature, as we can't configure all the resources.
2089 * e.g. The L3 cache is composed of two resources with 13 and 17 portion
2090 * bitmaps respectively.
2091 */
2092static void
2093__class_props_mismatch(struct mpam_class *class, struct mpam_vmsc *vmsc)
2094{
2095 struct mpam_props *cprops = &class->props;
2096 struct mpam_props *vprops = &vmsc->props;
2097 struct device *dev = &vmsc->msc->pdev->dev;
2098
2099 lockdep_assert_held(&mpam_list_lock); /* we modify class */
2100
2101 dev_dbg(dev, "Merging features for class:0x%lx &= vmsc:0x%lx\n",
2102 (long)cprops->features, (long)vprops->features);
2103
2104 /* Take the safe value for any common features */
2105 __props_mismatch(cprops, vprops, false);
2106}
2107
2108static void
2109__vmsc_props_mismatch(struct mpam_vmsc *vmsc, struct mpam_msc_ris *ris)
2110{
2111 struct mpam_props *rprops = &ris->props;
2112 struct mpam_props *vprops = &vmsc->props;
2113 struct device *dev = &vmsc->msc->pdev->dev;
2114
2115 lockdep_assert_held(&mpam_list_lock); /* we modify vmsc */
2116
2117 dev_dbg(dev, "Merging features for vmsc:0x%lx |= ris:0x%lx\n",
2118 (long)vprops->features, (long)rprops->features);
2119
2120 /*
2121 * Merge mismatched features - Copy any features that aren't common,
2122 * but take the safe value for any common features.
2123 */
2124 __props_mismatch(vprops, rprops, true);
2125}
2126
2127/*
2128 * Copy the first component's first vMSC's properties and features to the
2129 * class. __class_props_mismatch() will remove conflicts.
2130 * It is not possible to have a class with no components, or a component with
2131 * no resources. The vMSC properties have already been built.
2132 */
2133static void mpam_enable_init_class_features(struct mpam_class *class)
2134{
2135 struct mpam_vmsc *vmsc;
2136 struct mpam_component *comp;
2137
2138 comp = list_first_entry(&class->components,
2139 struct mpam_component, class_list);
2140 vmsc = list_first_entry(&comp->vmsc,
2141 struct mpam_vmsc, comp_list);
2142
2143 class->props = vmsc->props;
2144}
2145
2146static void mpam_enable_merge_vmsc_features(struct mpam_component *comp)
2147{
2148 struct mpam_vmsc *vmsc;
2149 struct mpam_msc_ris *ris;
2150 struct mpam_class *class = comp->class;
2151
2152 list_for_each_entry(vmsc, &comp->vmsc, comp_list) {
2153 list_for_each_entry(ris, &vmsc->ris, vmsc_list) {
2154 __vmsc_props_mismatch(vmsc, ris);
2155 class->nrdy_usec = max(class->nrdy_usec,
2156 vmsc->msc->nrdy_usec);
2157 }
2158 }
2159}
2160
2161static void mpam_enable_merge_class_features(struct mpam_component *comp)
2162{
2163 struct mpam_vmsc *vmsc;
2164 struct mpam_class *class = comp->class;
2165
2166 list_for_each_entry(vmsc, &comp->vmsc, comp_list)
2167 __class_props_mismatch(class, vmsc);
2168}
2169
2170/*
2171 * Merge all the common resource features into class.
2172 * vmsc features are bitwise-or'd together by mpam_enable_merge_vmsc_features()
2173 * as the first step so that mpam_enable_init_class_features() can initialise
2174 * the class with a representative set of features.
2175 * Next, mpam_enable_merge_class_features() bitwise-ands all the vmsc
2176 * features to form the class features.
2177 * Other features are the min/max as appropriate.
2178 *
2179 * To avoid walking the whole tree twice, the class->nrdy_usec property is
2180 * updated when working with the vmsc as it is a max(), and doesn't need
2181 * initialising first.
2182 */
2183static void mpam_enable_merge_features(struct list_head *all_classes_list)
2184{
2185 struct mpam_class *class;
2186 struct mpam_component *comp;
2187
2188 lockdep_assert_held(&mpam_list_lock);
2189
2190 list_for_each_entry(class, all_classes_list, classes_list) {
2191 list_for_each_entry(comp, &class->components, class_list)
2192 mpam_enable_merge_vmsc_features(comp);
2193
2194 mpam_enable_init_class_features(class);
2195
2196 list_for_each_entry(comp, &class->components, class_list)
2197 mpam_enable_merge_class_features(comp);
2198 }
2199}
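
/*
 * Illustrative order for a hypothetical class with two components, each
 * with one vmsc made of two RIS:
 *	vmsc0 |= ris0; vmsc0 |= ris1;	vmsc1 |= ris2; vmsc1 |= ris3;
 *	class = vmsc0;
 *	class &= vmsc0; class &= vmsc1;
 * where |= is the aliasing union and &= the non-aliasing intersection
 * performed by __props_mismatch().
 */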
2200
2201static const char * const mpam_errcode_names[16] = {
2202 [MPAM_ERRCODE_NONE] = "No error",
2203 [MPAM_ERRCODE_PARTID_SEL_RANGE] = "PARTID_SEL_Range",
2204 [MPAM_ERRCODE_REQ_PARTID_RANGE] = "Req_PARTID_Range",
2205 [MPAM_ERRCODE_MSMONCFG_ID_RANGE] = "MSMONCFG_ID_RANGE",
2206 [MPAM_ERRCODE_REQ_PMG_RANGE] = "Req_PMG_Range",
2207 [MPAM_ERRCODE_MONITOR_RANGE] = "Monitor_Range",
2208 [MPAM_ERRCODE_INTPARTID_RANGE] = "intPARTID_Range",
2209 [MPAM_ERRCODE_UNEXPECTED_INTERNAL] = "Unexpected_INTERNAL",
2210 [MPAM_ERRCODE_UNDEFINED_RIS_PART_SEL] = "Undefined_RIS_PART_SEL",
2211 [MPAM_ERRCODE_RIS_NO_CONTROL] = "RIS_No_Control",
2212 [MPAM_ERRCODE_UNDEFINED_RIS_MON_SEL] = "Undefined_RIS_MON_SEL",
2213 [MPAM_ERRCODE_RIS_NO_MONITOR] = "RIS_No_Monitor",
2214 [12 ... 15] = "Reserved"
2215};
2216
2217static int mpam_enable_msc_ecr(void *_msc)
2218{
2219 struct mpam_msc *msc = _msc;
2220
2221 __mpam_write_reg(msc, MPAMF_ECR, MPAMF_ECR_INTEN);
2222
2223 return 0;
2224}
2225
2226/* Called from mpam_disable(), and from the interrupt handler on the same CPU */
2227static int mpam_disable_msc_ecr(void *_msc)
2228{
2229 struct mpam_msc *msc = _msc;
2230
2231 __mpam_write_reg(msc, MPAMF_ECR, 0);
2232
2233 return 0;
2234}
2235
2236static irqreturn_t __mpam_irq_handler(int irq, struct mpam_msc *msc)
2237{
2238 u64 reg;
2239 u16 partid;
2240 u8 errcode, pmg, ris;
2241
2242 if (WARN_ON_ONCE(!msc) ||
2243 WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(),
2244 &msc->accessibility)))
2245 return IRQ_NONE;
2246
2247 reg = mpam_msc_read_esr(msc);
2248
2249 errcode = FIELD_GET(MPAMF_ESR_ERRCODE, reg);
2250 if (!errcode)
2251 return IRQ_NONE;
2252
2253 /* Clear level triggered irq */
2254 mpam_msc_clear_esr(msc);
2255
2256 partid = FIELD_GET(MPAMF_ESR_PARTID_MON, reg);
2257 pmg = FIELD_GET(MPAMF_ESR_PMG, reg);
2258 ris = FIELD_GET(MPAMF_ESR_RIS, reg);
2259
2260 pr_err_ratelimited("error irq from msc:%u '%s', partid:%u, pmg:%u, ris:%u\n",
2261 msc->id, mpam_errcode_names[errcode], partid, pmg,
2262 ris);
2263
2264 /* Disable this interrupt. */
2265 mpam_disable_msc_ecr(msc);
2266
2267 /* Are we racing with the thread disabling MPAM? */
2268 if (!mpam_is_enabled())
2269 return IRQ_HANDLED;
2270
2271 /*
2272 * Schedule the teardown work. Don't use a threaded IRQ as we can't
2273 * unregister the interrupt from the threaded part of the handler.
2274 */
2275 mpam_disable_reason = "hardware error interrupt";
2276 schedule_work(&mpam_broken_work);
2277
2278 return IRQ_HANDLED;
2279}
2280
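/*
 * For a PPI the interrupt was registered with request_percpu_irq() and
 * dev_id is this CPU's instance of msc->error_dev_id, which holds the msc
 * pointer, hence the extra dereference. For an SPI, dev_id is the msc itself.
 */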
2281static irqreturn_t mpam_ppi_handler(int irq, void *dev_id)
2282{
2283 struct mpam_msc *msc = *(struct mpam_msc **)dev_id;
2284
2285 return __mpam_irq_handler(irq, msc);
2286}
2287
2288static irqreturn_t mpam_spi_handler(int irq, void *dev_id)
2289{
2290 struct mpam_msc *msc = dev_id;
2291
2292 return __mpam_irq_handler(irq, msc);
2293}
2294
2295static int mpam_register_irqs(void)
2296{
2297 int err, irq;
2298 struct mpam_msc *msc;
2299
2300 lockdep_assert_cpus_held();
2301
2302 guard(srcu)(&mpam_srcu);
2303 list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
2304 srcu_read_lock_held(&mpam_srcu)) {
2305 irq = platform_get_irq_byname_optional(msc->pdev, "error");
2306 if (irq <= 0)
2307 continue;
2308
2309 /* The MPAM spec says the interrupt can be SPI, PPI or LPI */
2310 /* We anticipate sharing the interrupt with other MSCs */
2311 if (irq_is_percpu(irq)) {
2312 err = request_percpu_irq(irq, &mpam_ppi_handler,
2313 "mpam:msc:error",
2314 msc->error_dev_id);
2315 if (err)
2316 return err;
2317
2318 msc->reenable_error_ppi = irq;
2319 smp_call_function_many(&msc->accessibility,
2320 &_enable_percpu_irq, &irq,
2321 true);
2322 } else {
2323 err = devm_request_irq(&msc->pdev->dev, irq,
2324 &mpam_spi_handler, IRQF_SHARED,
2325 "mpam:msc:error", msc);
2326 if (err)
2327 return err;
2328 }
2329
2330 mutex_lock(&msc->error_irq_lock);
2331 msc->error_irq_req = true;
2332 mpam_touch_msc(msc, mpam_enable_msc_ecr, msc);
2333 msc->error_irq_hw_enabled = true;
2334 mutex_unlock(&msc->error_irq_lock);
2335 }
2336
2337 return 0;
2338}
2339
2340static void mpam_unregister_irqs(void)
2341{
2342 int irq;
2343 struct mpam_msc *msc;
2344
2345 guard(cpus_read_lock)();
2346 guard(srcu)(&mpam_srcu);
2347 list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
2348 srcu_read_lock_held(&mpam_srcu)) {
2349 irq = platform_get_irq_byname_optional(msc->pdev, "error");
2350 if (irq <= 0)
2351 continue;
2352
2353 mutex_lock(&msc->error_irq_lock);
2354 if (msc->error_irq_hw_enabled) {
2355 mpam_touch_msc(msc, mpam_disable_msc_ecr, msc);
2356 msc->error_irq_hw_enabled = false;
2357 }
2358
2359 if (msc->error_irq_req) {
2360 if (irq_is_percpu(irq)) {
2361 msc->reenable_error_ppi = 0;
2362 free_percpu_irq(irq, msc->error_dev_id);
2363 } else {
2364 devm_free_irq(&msc->pdev->dev, irq, msc);
2365 }
2366 msc->error_irq_req = false;
2367 }
2368 mutex_unlock(&msc->error_irq_lock);
2369 }
2370}
2371
2372static void __destroy_component_cfg(struct mpam_component *comp)
2373{
2374 struct mpam_msc *msc;
2375 struct mpam_vmsc *vmsc;
2376 struct mpam_msc_ris *ris;
2377
2378 lockdep_assert_held(&mpam_list_lock);
2379
2380 add_to_garbage(comp->cfg);
2381 list_for_each_entry(vmsc, &comp->vmsc, comp_list) {
2382 msc = vmsc->msc;
2383
2384 if (mpam_mon_sel_lock(msc)) {
2385 list_for_each_entry(ris, &vmsc->ris, vmsc_list)
2386 add_to_garbage(ris->mbwu_state);
2387 mpam_mon_sel_unlock(msc);
2388 }
2389 }
2390}
2391
2392static void mpam_reset_component_cfg(struct mpam_component *comp)
2393{
2394 int i;
2395 struct mpam_props *cprops = &comp->class->props;
2396
2397 mpam_assert_partid_sizes_fixed();
2398
2399 if (!comp->cfg)
2400 return;
2401
2402 for (i = 0; i <= mpam_partid_max; i++) {
2403 comp->cfg[i] = (struct mpam_config) {};
2404 if (cprops->cpbm_wd)
2405 comp->cfg[i].cpbm = GENMASK(cprops->cpbm_wd - 1, 0);
2406 if (cprops->mbw_pbm_bits)
2407 comp->cfg[i].mbw_pbm = GENMASK(cprops->mbw_pbm_bits - 1, 0);
2408 if (cprops->bwa_wd)
2409 comp->cfg[i].mbw_max = GENMASK(15, 16 - cprops->bwa_wd);
2410 }
2411}
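
/*
 * Example reset values, assuming cpbm_wd = 16, mbw_pbm_bits = 8 and
 * bwa_wd = 8: every partid gets cpbm = 0xffff, mbw_pbm = 0xff and
 * mbw_max = 0xff00, i.e. all portions and the largest expressible
 * bandwidth limit are allowed.
 */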
2412
2413static int __allocate_component_cfg(struct mpam_component *comp)
2414{
2415 struct mpam_vmsc *vmsc;
2416
2417 mpam_assert_partid_sizes_fixed();
2418
2419 if (comp->cfg)
2420 return 0;
2421
2422 comp->cfg = kcalloc(mpam_partid_max + 1, sizeof(*comp->cfg), GFP_KERNEL);
2423 if (!comp->cfg)
2424 return -ENOMEM;
2425
2426 /*
2427 * The array is freed in one go, so only cfg[0]'s garbage structure
2428 * needs to be initialised.
2429 */
2430 init_garbage(&comp->cfg[0].garbage);
2431
2432 mpam_reset_component_cfg(comp);
2433
2434 list_for_each_entry(vmsc, &comp->vmsc, comp_list) {
2435 struct mpam_msc *msc;
2436 struct mpam_msc_ris *ris;
2437 struct msmon_mbwu_state *mbwu_state;
2438
2439 if (!vmsc->props.num_mbwu_mon)
2440 continue;
2441
2442 msc = vmsc->msc;
2443 list_for_each_entry(ris, &vmsc->ris, vmsc_list) {
2444 if (!ris->props.num_mbwu_mon)
2445 continue;
2446
2447 mbwu_state = kcalloc(ris->props.num_mbwu_mon,
2448 sizeof(*ris->mbwu_state),
2449 GFP_KERNEL);
2450 if (!mbwu_state) {
2451 __destroy_component_cfg(comp);
2452 return -ENOMEM;
2453 }
2454
2455 init_garbage(&mbwu_state[0].garbage);
2456
2457 if (mpam_mon_sel_lock(msc)) {
2458 ris->mbwu_state = mbwu_state;
2459 mpam_mon_sel_unlock(msc);
2460 }
2461 }
2462 }
2463
2464 return 0;
2465}
2466
2467static int mpam_allocate_config(void)
2468{
2469 struct mpam_class *class;
2470 struct mpam_component *comp;
2471
2472 lockdep_assert_held(&mpam_list_lock);
2473
2474 list_for_each_entry(class, &mpam_classes, classes_list) {
2475 list_for_each_entry(comp, &class->components, class_list) {
2476 int err = __allocate_component_cfg(comp);
2477 if (err)
2478 return err;
2479 }
2480 }
2481
2482 return 0;
2483}
2484
2485static void mpam_enable_once(void)
2486{
2487 int err;
2488
2489 /*
2490 * Once the cpuhp callbacks have been changed, mpam_partid_max can no
2491 * longer change.
2492 */
2493 spin_lock(&partid_max_lock);
2494 partid_max_published = true;
2495 spin_unlock(&partid_max_lock);
2496
2497 /*
2498 * If all the MSC have been probed, enabling the IRQs happens next.
2499 * That involves cross-calling to a CPU that can reach the MSC, and
2500 * the locks must be taken in this order:
2501 */
2502 cpus_read_lock();
2503 mutex_lock(&mpam_list_lock);
2504 do {
2505 mpam_enable_merge_features(&mpam_classes);
2506
2507 err = mpam_register_irqs();
2508 if (err) {
2509 pr_warn("Failed to register irqs: %d\n", err);
2510 break;
2511 }
2512
2513 err = mpam_allocate_config();
2514 if (err) {
2515 pr_err("Failed to allocate configuration arrays.\n");
2516 break;
2517 }
2518 } while (0);
2519 mutex_unlock(&mpam_list_lock);
2520 cpus_read_unlock();
2521
2522 if (err) {
2523 mpam_disable_reason = "failure during enable";
2524 schedule_work(&mpam_broken_work);
2525 return;
2526 }
2527
2528 static_branch_enable(&mpam_enabled);
2529 mpam_register_cpuhp_callbacks(mpam_cpu_online, mpam_cpu_offline,
2530 "mpam:online");
2531
2532 /* Use printk() to avoid the pr_fmt adding the function name. */
2533 printk(KERN_INFO "MPAM enabled with %u PARTIDs and %u PMGs\n",
2534 mpam_partid_max + 1, mpam_pmg_max + 1);
2535}
2536
2537static void mpam_reset_component_locked(struct mpam_component *comp)
2538{
2539 struct mpam_vmsc *vmsc;
2540
2541 lockdep_assert_cpus_held();
2542 mpam_assert_partid_sizes_fixed();
2543
2544 mpam_reset_component_cfg(comp);
2545
2546 guard(srcu)(&mpam_srcu);
2547 list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
2548 srcu_read_lock_held(&mpam_srcu)) {
2549 struct mpam_msc *msc = vmsc->msc;
2550 struct mpam_msc_ris *ris;
2551
2552 list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
2553 srcu_read_lock_held(&mpam_srcu)) {
2554 if (!ris->in_reset_state)
2555 mpam_touch_msc(msc, mpam_reset_ris, ris);
2556 ris->in_reset_state = true;
2557 }
2558 }
2559}
2560
2561static void mpam_reset_class_locked(struct mpam_class *class)
2562{
2563 struct mpam_component *comp;
2564
2565 lockdep_assert_cpus_held();
2566
2567 guard(srcu)(&mpam_srcu);
2568 list_for_each_entry_srcu(comp, &class->components, class_list,
2569 srcu_read_lock_held(&mpam_srcu))
2570 mpam_reset_component_locked(comp);
2571}
2572
2573static void mpam_reset_class(struct mpam_class *class)
2574{
2575 cpus_read_lock();
2576 mpam_reset_class_locked(class);
2577 cpus_read_unlock();
2578}
2579
2580/*
2581 * Called in response to an error IRQ.
2582 * All of MPAM's errors indicate a software bug; restore any modified
2583 * controls to their reset values.
2584 */
2585void mpam_disable(struct work_struct *ignored)
2586{
2587 int idx;
2588 struct mpam_class *class;
2589 struct mpam_msc *msc, *tmp;
2590
2591 mutex_lock(&mpam_cpuhp_state_lock);
2592 if (mpam_cpuhp_state) {
2593 cpuhp_remove_state(mpam_cpuhp_state);
2594 mpam_cpuhp_state = 0;
2595 }
2596 mutex_unlock(&mpam_cpuhp_state_lock);
2597
2598 static_branch_disable(&mpam_enabled);
2599
2600 mpam_unregister_irqs();
2601
2602 idx = srcu_read_lock(&mpam_srcu);
2603 list_for_each_entry_srcu(class, &mpam_classes, classes_list,
2604 srcu_read_lock_held(&mpam_srcu))
2605 mpam_reset_class(class);
2606 srcu_read_unlock(&mpam_srcu, idx);
2607
2608 mutex_lock(&mpam_list_lock);
2609 list_for_each_entry_safe(msc, tmp, &mpam_all_msc, all_msc_list)
2610 mpam_msc_destroy(msc);
2611 mutex_unlock(&mpam_list_lock);
2612 mpam_free_garbage();
2613
2614 pr_err_once("MPAM disabled due to %s\n", mpam_disable_reason);
2615}
2616
2617/*
2618 * Enable mpam once all devices have been probed.
2619 * Scheduled by mpam_discovery_cpu_online() once all devices have been created.
2620 * Also scheduled when new devices are probed as new CPUs come online.
2621 */
2622void mpam_enable(struct work_struct *work)
2623{
2624 static atomic_t once;
2625 struct mpam_msc *msc;
2626 bool all_devices_probed = true;
2627
2628 /* Have we probed all the hw devices? */
2629 guard(srcu)(&mpam_srcu);
2630 list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
2631 srcu_read_lock_held(&mpam_srcu)) {
2632 mutex_lock(&msc->probe_lock);
2633 if (!msc->probed)
2634 all_devices_probed = false;
2635 mutex_unlock(&msc->probe_lock);
2636
2637 if (!all_devices_probed)
2638 break;
2639 }
2640
2641 if (all_devices_probed && !atomic_fetch_inc(&once))
2642 mpam_enable_once();
2643}
2644
2645#define maybe_update_config(cfg, feature, newcfg, member, changes) do { \
2646 if (mpam_has_feature(feature, newcfg) && \
2647 (newcfg)->member != (cfg)->member) { \
2648 (cfg)->member = (newcfg)->member; \
2649 mpam_set_feature(feature, cfg); \
2650 \
2651 (changes) = true; \
2652 } \
2653} while (0)
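
/*
 * For example, maybe_update_config(cfg, mpam_feat_cpor_part, newcfg, cpbm,
 * changes) copies newcfg->cpbm into cfg->cpbm, marks cpor_part as set in cfg
 * and sets 'changes', but only if newcfg has cpor_part and the bitmaps differ.
 */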
2654
2655static bool mpam_update_config(struct mpam_config *cfg,
2656 const struct mpam_config *newcfg)
2657{
2658 bool has_changes = false;
2659
2660 maybe_update_config(cfg, mpam_feat_cpor_part, newcfg, cpbm, has_changes);
2661 maybe_update_config(cfg, mpam_feat_mbw_part, newcfg, mbw_pbm, has_changes);
2662 maybe_update_config(cfg, mpam_feat_mbw_max, newcfg, mbw_max, has_changes);
2663
2664 return has_changes;
2665}
2666
2667int mpam_apply_config(struct mpam_component *comp, u16 partid,
2668 struct mpam_config *cfg)
2669{
2670 struct mpam_write_config_arg arg;
2671 struct mpam_msc_ris *ris;
2672 struct mpam_vmsc *vmsc;
2673 struct mpam_msc *msc;
2674
2675 lockdep_assert_cpus_held();
2676
2677 /* Don't pass in the current config! */
2678 WARN_ON_ONCE(&comp->cfg[partid] == cfg);
2679
2680 if (!mpam_update_config(&comp->cfg[partid], cfg))
2681 return 0;
2682
2683 arg.comp = comp;
2684 arg.partid = partid;
2685
2686 guard(srcu)(&mpam_srcu);
2687 list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
2688 srcu_read_lock_held(&mpam_srcu)) {
2689 msc = vmsc->msc;
2690
2691 mutex_lock(&msc->cfg_lock);
2692 list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
2693 srcu_read_lock_held(&mpam_srcu)) {
2694 arg.ris = ris;
2695 mpam_touch_msc(msc, __write_config, &arg);
2696 }
2697 mutex_unlock(&msc->cfg_lock);
2698 }
2699
2700 return 0;
2701}
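
/*
 * A minimal caller sketch (hypothetical, e.g. a resctrl glue layer): build a
 * partial struct mpam_config, set only the features being changed, and call
 * mpam_apply_config() under cpus_read_lock() so the MSC cross-calls can't
 * race with CPU hotplug:
 *
 *	struct mpam_config cfg = {};
 *	int err;
 *
 *	mpam_set_feature(mpam_feat_cpor_part, &cfg);
 *	cfg.cpbm = 0x00ff;
 *
 *	cpus_read_lock();
 *	err = mpam_apply_config(comp, partid, &cfg);
 *	cpus_read_unlock();
 */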
2702
2703static int __init mpam_msc_driver_init(void)
2704{
2705 if (!system_supports_mpam())
2706 return -EOPNOTSUPP;
2707
2708 init_srcu_struct(&mpam_srcu);
2709
2710 fw_num_msc = acpi_mpam_count_msc();
2711 if (fw_num_msc <= 0) {
2712 pr_err("No MSC devices found in firmware\n");
2713 return -EINVAL;
2714 }
2715
2716 return platform_driver_register(&mpam_msc_driver);
2717}
2718
2719/* Must occur after arm64_mpam_register_cpus() from arch_initcall() */
2720subsys_initcall(mpam_msc_driver_init);
2721
2722#ifdef CONFIG_MPAM_KUNIT_TEST
2723#include "test_mpam_devices.c"
2724#endif