xref: /linux/drivers/resctrl/mpam_devices.c (revision e28ddd0b7af218e1a8863c524e15918895af9ac8)
1 // SPDX-License-Identifier: GPL-2.0
2 // Copyright (C) 2025 Arm Ltd.
3 
4 #define pr_fmt(fmt) "%s:%s: " fmt, KBUILD_MODNAME, __func__
5 
6 #include <linux/acpi.h>
7 #include <linux/atomic.h>
8 #include <linux/arm_mpam.h>
9 #include <linux/bitfield.h>
10 #include <linux/bitmap.h>
11 #include <linux/cacheinfo.h>
12 #include <linux/cpu.h>
13 #include <linux/cpumask.h>
14 #include <linux/device.h>
15 #include <linux/errno.h>
16 #include <linux/gfp.h>
17 #include <linux/interrupt.h>
18 #include <linux/irq.h>
19 #include <linux/irqdesc.h>
20 #include <linux/list.h>
21 #include <linux/lockdep.h>
22 #include <linux/mutex.h>
23 #include <linux/platform_device.h>
24 #include <linux/printk.h>
25 #include <linux/srcu.h>
26 #include <linux/spinlock.h>
27 #include <linux/types.h>
28 #include <linux/workqueue.h>
29 
30 #include "mpam_internal.h"
31 
32 DEFINE_STATIC_KEY_FALSE(mpam_enabled); /* This moves to arch code */
33 
34 /*
35  * mpam_list_lock protects the SRCU lists when writing. Once the
36  * mpam_enabled key is enabled these lists are read-only,
37  * unless the error interrupt disables the driver.
38  */
39 static DEFINE_MUTEX(mpam_list_lock);
40 static LIST_HEAD(mpam_all_msc);
41 
42 struct srcu_struct mpam_srcu;
43 
44 /*
45  * Number of MSCs that have been probed. Once all MSCs have been probed MPAM
46  * can be enabled.
47  */
48 static atomic_t mpam_num_msc;
49 
50 static int mpam_cpuhp_state;
51 static DEFINE_MUTEX(mpam_cpuhp_state_lock);
52 
53 /*
54  * The smallest common values for any CPU or MSC in the system.
55  * Generating traffic outside this range will result in screaming interrupts.
56  */
57 u16 mpam_partid_max;
58 u8 mpam_pmg_max;
59 static bool partid_max_init, partid_max_published;
60 static DEFINE_SPINLOCK(partid_max_lock);
61 
62 /*
63  * mpam is enabled once all devices have been probed from CPU online callbacks,
64  * scheduled via this work_struct. If access to an MSC depends on a CPU that
65  * was not brought online at boot, this can happen surprisingly late.
66  */
67 static DECLARE_WORK(mpam_enable_work, &mpam_enable);
68 
69 /*
70  * All mpam error interrupts indicate a software bug. On receipt, disable the
71  * driver.
72  */
73 static DECLARE_WORK(mpam_broken_work, &mpam_disable);
74 
 75 /* When mpam is disabled, this reason is printed to aid debugging */
76 static char *mpam_disable_reason;
77 
78 /*
79  * An MSC is a physical container for controls and monitors, each identified by
80  * their RIS index. These share a base-address, interrupts and some MMIO
81  * registers. A vMSC is a virtual container for RIS in an MSC that control or
82  * monitor the same thing. Members of a vMSC are all RIS in the same MSC, but
83  * not all RIS in an MSC share a vMSC.
84  *
85  * Components are a group of vMSC that control or monitor the same thing but
86  * are from different MSC, so have different base-address, interrupts etc.
 87  * Classes are the set of components of the same type.
88  *
 89  * The features of a vMSC are the union of the RIS it contains.
90  * The features of a Class and Component are the common subset of the vMSC
91  * they contain.
92  *
93  * e.g. The system cache may have bandwidth controls on multiple interfaces,
94  * for regulating traffic from devices independently of traffic from CPUs.
95  * If these are two RIS in one MSC, they will be treated as controlling
96  * different things, and will not share a vMSC/component/class.
97  *
98  * e.g. The L2 may have one MSC and two RIS, one for cache-controls another
99  * for bandwidth. These two RIS are members of the same vMSC.
100  *
101  * e.g. The set of RIS that make up the L2 are grouped as a component. These
102  * are sometimes termed slices. They should be configured the same, as if there
103  * were only one.
104  *
105  * e.g. The SoC probably has more than one L2, each attached to a distinct set
106  * of CPUs. All the L2 components are grouped as a class.
107  *
 108  * When creating an MSC, struct mpam_msc is added to the mpam_all_msc list,
109  * then linked via struct mpam_ris to a vmsc, component and class.
110  * The same MSC may exist under different class->component->vmsc paths, but the
111  * RIS index will be unique.
112  */
113 LIST_HEAD(mpam_classes);
114 
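/*
 * Illustrative sketch of the structures described above (added for clarity,
 * not part of the original source):
 *
 *   mpam_classes --> struct mpam_class          (e.g. "all L2 caches")
 *                      `-> struct mpam_component     (one particular L2)
 *                            `-> struct mpam_vmsc        (RIS within one MSC)
 *                                  `-> struct mpam_msc_ris
 *
 *   mpam_all_msc --> struct mpam_msc, whose msc->ris list links the same
 *                    struct mpam_msc_ris entries from the MSC side.
 */
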
115 /* List of all objects that can be free()d after synchronise_srcu() */
116 static LLIST_HEAD(mpam_garbage);
117 
118 static inline void init_garbage(struct mpam_garbage *garbage)
119 {
120 	init_llist_node(&garbage->llist);
121 }
122 
123 #define add_to_garbage(x)				\
124 do {							\
125 	__typeof__(x) _x = (x);				\
126 	_x->garbage.to_free = _x;			\
127 	llist_add(&_x->garbage.llist, &mpam_garbage);	\
128 } while (0)
129 
130 static void mpam_free_garbage(void)
131 {
132 	struct mpam_garbage *iter, *tmp;
133 	struct llist_node *to_free = llist_del_all(&mpam_garbage);
134 
135 	if (!to_free)
136 		return;
137 
138 	synchronize_srcu(&mpam_srcu);
139 
140 	llist_for_each_entry_safe(iter, tmp, to_free, llist) {
141 		if (iter->pdev)
142 			devm_kfree(&iter->pdev->dev, iter->to_free);
143 		else
144 			kfree(iter->to_free);
145 	}
146 }
147 
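/*
 * Illustrative sketch (an assumption for clarity, not in the original file):
 * the expected lifecycle of an object that embeds struct mpam_garbage is
 *
 *	obj = kzalloc(sizeof(*obj), GFP_KERNEL);
 *	init_garbage(&obj->garbage);		// while building the lists
 *	...
 *	list_del_rcu(&obj->some_list);		// unlink under mpam_list_lock
 *	add_to_garbage(obj);			// defer the free
 *	...
 *	mpam_free_garbage();			// after dropping mpam_list_lock:
 *						// synchronize_srcu(), then free
 *
 * Objects allocated with devm_kzalloc() additionally set garbage.pdev so
 * that mpam_free_garbage() uses devm_kfree() instead of kfree().
 */
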
148 /*
149  * Once mpam is enabled, new requestors cannot further reduce the available
150  * partid. Assert that the size is fixed, and new requestors will be turned
151  * away.
152  */
153 static void mpam_assert_partid_sizes_fixed(void)
154 {
155 	WARN_ON_ONCE(!partid_max_published);
156 }
157 
158 static u32 __mpam_read_reg(struct mpam_msc *msc, u16 reg)
159 {
160 	WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(), &msc->accessibility));
161 
162 	return readl_relaxed(msc->mapped_hwpage + reg);
163 }
164 
165 static inline u32 _mpam_read_partsel_reg(struct mpam_msc *msc, u16 reg)
166 {
167 	lockdep_assert_held_once(&msc->part_sel_lock);
168 	return __mpam_read_reg(msc, reg);
169 }
170 
171 #define mpam_read_partsel_reg(msc, reg) _mpam_read_partsel_reg(msc, MPAMF_##reg)
172 
173 static void __mpam_write_reg(struct mpam_msc *msc, u16 reg, u32 val)
174 {
175 	WARN_ON_ONCE(reg + sizeof(u32) > msc->mapped_hwpage_sz);
176 	WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(), &msc->accessibility));
177 
178 	writel_relaxed(val, msc->mapped_hwpage + reg);
179 }
180 
181 static inline void _mpam_write_partsel_reg(struct mpam_msc *msc, u16 reg, u32 val)
182 {
183 	lockdep_assert_held_once(&msc->part_sel_lock);
184 	__mpam_write_reg(msc, reg, val);
185 }
186 
187 #define mpam_write_partsel_reg(msc, reg, val)  _mpam_write_partsel_reg(msc, MPAMCFG_##reg, val)
188 
189 static inline u32 _mpam_read_monsel_reg(struct mpam_msc *msc, u16 reg)
190 {
191 	mpam_mon_sel_lock_held(msc);
192 	return __mpam_read_reg(msc, reg);
193 }
194 
195 #define mpam_read_monsel_reg(msc, reg) _mpam_read_monsel_reg(msc, MSMON_##reg)
196 
197 static inline void _mpam_write_monsel_reg(struct mpam_msc *msc, u16 reg, u32 val)
198 {
199 	mpam_mon_sel_lock_held(msc);
200 	__mpam_write_reg(msc, reg, val);
201 }
202 
203 #define mpam_write_monsel_reg(msc, reg, val)   _mpam_write_monsel_reg(msc, MSMON_##reg, val)
204 
205 static u64 mpam_msc_read_idr(struct mpam_msc *msc)
206 {
207 	u64 idr_high = 0, idr_low;
208 
209 	lockdep_assert_held(&msc->part_sel_lock);
210 
211 	idr_low = mpam_read_partsel_reg(msc, IDR);
212 	if (FIELD_GET(MPAMF_IDR_EXT, idr_low))
213 		idr_high = mpam_read_partsel_reg(msc, IDR + 4);
214 
215 	return (idr_high << 32) | idr_low;
216 }
217 
218 static void mpam_msc_clear_esr(struct mpam_msc *msc)
219 {
220 	u64 esr_low = __mpam_read_reg(msc, MPAMF_ESR);
221 
222 	if (!esr_low)
223 		return;
224 
225 	/*
226 	 * Clearing the high/low bits of MPAMF_ESR cannot be atomic.
227 	 * Clear the top half first, so that the pending error bits in the
228 	 * lower half prevent hardware from updating either half of the
229 	 * register.
230 	 */
231 	if (msc->has_extd_esr)
232 		__mpam_write_reg(msc, MPAMF_ESR + 4, 0);
233 	__mpam_write_reg(msc, MPAMF_ESR, 0);
234 }
235 
236 static u64 mpam_msc_read_esr(struct mpam_msc *msc)
237 {
238 	u64 esr_high = 0, esr_low;
239 
240 	esr_low = __mpam_read_reg(msc, MPAMF_ESR);
241 	if (msc->has_extd_esr)
242 		esr_high = __mpam_read_reg(msc, MPAMF_ESR + 4);
243 
244 	return (esr_high << 32) | esr_low;
245 }
246 
247 static void __mpam_part_sel_raw(u32 partsel, struct mpam_msc *msc)
248 {
249 	lockdep_assert_held(&msc->part_sel_lock);
250 
251 	mpam_write_partsel_reg(msc, PART_SEL, partsel);
252 }
253 
254 static void __mpam_part_sel(u8 ris_idx, u16 partid, struct mpam_msc *msc)
255 {
256 	u32 partsel = FIELD_PREP(MPAMCFG_PART_SEL_RIS, ris_idx) |
257 		      FIELD_PREP(MPAMCFG_PART_SEL_PARTID_SEL, partid);
258 
259 	__mpam_part_sel_raw(partsel, msc);
260 }
261 
262 static void __mpam_intpart_sel(u8 ris_idx, u16 intpartid, struct mpam_msc *msc)
263 {
264 	u32 partsel = FIELD_PREP(MPAMCFG_PART_SEL_RIS, ris_idx) |
265 		      FIELD_PREP(MPAMCFG_PART_SEL_PARTID_SEL, intpartid) |
266 		      MPAMCFG_PART_SEL_INTERNAL;
267 
268 	__mpam_part_sel_raw(partsel, msc);
269 }
270 
271 int mpam_register_requestor(u16 partid_max, u8 pmg_max)
272 {
273 	guard(spinlock)(&partid_max_lock);
274 	if (!partid_max_init) {
275 		mpam_partid_max = partid_max;
276 		mpam_pmg_max = pmg_max;
277 		partid_max_init = true;
278 	} else if (!partid_max_published) {
279 		mpam_partid_max = min(mpam_partid_max, partid_max);
280 		mpam_pmg_max = min(mpam_pmg_max, pmg_max);
281 	} else {
282 		/* New requestors can't lower the values */
283 		if (partid_max < mpam_partid_max || pmg_max < mpam_pmg_max)
284 			return -EBUSY;
285 	}
286 
287 	return 0;
288 }
289 EXPORT_SYMBOL(mpam_register_requestor);
290 
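/*
 * Example caller (illustrative only): a requestor, such as the arch CPU code,
 * registers the PARTID/PMG range it can generate before MPAM is enabled.
 * Values are clamped to the smallest common range; once the range has been
 * published, a requestor that needs a smaller range gets -EBUSY:
 *
 *	err = mpam_register_requestor(cpu_partid_max, cpu_pmg_max);
 *	if (err)
 *		pr_err("Requestor range conflicts with the published range\n");
 *
 * cpu_partid_max/cpu_pmg_max are hypothetical names for whatever the caller
 * discovered from its ID registers.
 */
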
291 static struct mpam_class *
292 mpam_class_alloc(u8 level_idx, enum mpam_class_types type)
293 {
294 	struct mpam_class *class;
295 
296 	lockdep_assert_held(&mpam_list_lock);
297 
298 	class = kzalloc(sizeof(*class), GFP_KERNEL);
299 	if (!class)
300 		return ERR_PTR(-ENOMEM);
301 	init_garbage(&class->garbage);
302 
303 	INIT_LIST_HEAD_RCU(&class->components);
304 	/* Affinity is updated when ris are added */
305 	class->level = level_idx;
306 	class->type = type;
307 	INIT_LIST_HEAD_RCU(&class->classes_list);
308 	ida_init(&class->ida_csu_mon);
309 	ida_init(&class->ida_mbwu_mon);
310 
311 	list_add_rcu(&class->classes_list, &mpam_classes);
312 
313 	return class;
314 }
315 
316 static void mpam_class_destroy(struct mpam_class *class)
317 {
318 	lockdep_assert_held(&mpam_list_lock);
319 
320 	list_del_rcu(&class->classes_list);
321 	add_to_garbage(class);
322 }
323 
324 static struct mpam_class *
325 mpam_class_find(u8 level_idx, enum mpam_class_types type)
326 {
327 	struct mpam_class *class;
328 
329 	lockdep_assert_held(&mpam_list_lock);
330 
331 	list_for_each_entry(class, &mpam_classes, classes_list) {
332 		if (class->type == type && class->level == level_idx)
333 			return class;
334 	}
335 
336 	return mpam_class_alloc(level_idx, type);
337 }
338 
339 static struct mpam_component *
340 mpam_component_alloc(struct mpam_class *class, int id)
341 {
342 	struct mpam_component *comp;
343 
344 	lockdep_assert_held(&mpam_list_lock);
345 
346 	comp = kzalloc(sizeof(*comp), GFP_KERNEL);
347 	if (!comp)
348 		return ERR_PTR(-ENOMEM);
349 	init_garbage(&comp->garbage);
350 
351 	comp->comp_id = id;
352 	INIT_LIST_HEAD_RCU(&comp->vmsc);
353 	/* Affinity is updated when RIS are added */
354 	INIT_LIST_HEAD_RCU(&comp->class_list);
355 	comp->class = class;
356 
357 	list_add_rcu(&comp->class_list, &class->components);
358 
359 	return comp;
360 }
361 
362 static void __destroy_component_cfg(struct mpam_component *comp);
363 
364 static void mpam_component_destroy(struct mpam_component *comp)
365 {
366 	struct mpam_class *class = comp->class;
367 
368 	lockdep_assert_held(&mpam_list_lock);
369 
370 	__destroy_component_cfg(comp);
371 
372 	list_del_rcu(&comp->class_list);
373 	add_to_garbage(comp);
374 
375 	if (list_empty(&class->components))
376 		mpam_class_destroy(class);
377 }
378 
379 static struct mpam_component *
380 mpam_component_find(struct mpam_class *class, int id)
381 {
382 	struct mpam_component *comp;
383 
384 	lockdep_assert_held(&mpam_list_lock);
385 
386 	list_for_each_entry(comp, &class->components, class_list) {
387 		if (comp->comp_id == id)
388 			return comp;
389 	}
390 
391 	return mpam_component_alloc(class, id);
392 }
393 
394 static struct mpam_vmsc *
395 mpam_vmsc_alloc(struct mpam_component *comp, struct mpam_msc *msc)
396 {
397 	struct mpam_vmsc *vmsc;
398 
399 	lockdep_assert_held(&mpam_list_lock);
400 
401 	vmsc = kzalloc(sizeof(*vmsc), GFP_KERNEL);
402 	if (!vmsc)
403 		return ERR_PTR(-ENOMEM);
404 	init_garbage(&vmsc->garbage);
405 
406 	INIT_LIST_HEAD_RCU(&vmsc->ris);
407 	INIT_LIST_HEAD_RCU(&vmsc->comp_list);
408 	vmsc->comp = comp;
409 	vmsc->msc = msc;
410 
411 	list_add_rcu(&vmsc->comp_list, &comp->vmsc);
412 
413 	return vmsc;
414 }
415 
416 static void mpam_vmsc_destroy(struct mpam_vmsc *vmsc)
417 {
418 	struct mpam_component *comp = vmsc->comp;
419 
420 	lockdep_assert_held(&mpam_list_lock);
421 
422 	list_del_rcu(&vmsc->comp_list);
423 	add_to_garbage(vmsc);
424 
425 	if (list_empty(&comp->vmsc))
426 		mpam_component_destroy(comp);
427 }
428 
429 static struct mpam_vmsc *
430 mpam_vmsc_find(struct mpam_component *comp, struct mpam_msc *msc)
431 {
432 	struct mpam_vmsc *vmsc;
433 
434 	lockdep_assert_held(&mpam_list_lock);
435 
436 	list_for_each_entry(vmsc, &comp->vmsc, comp_list) {
437 		if (vmsc->msc->id == msc->id)
438 			return vmsc;
439 	}
440 
441 	return mpam_vmsc_alloc(comp, msc);
442 }
443 
444 /*
445  * The cacheinfo structures are only populated when CPUs are online.
446  * This helper walks the acpi tables to include offline CPUs too.
447  */
448 int mpam_get_cpumask_from_cache_id(unsigned long cache_id, u32 cache_level,
449 				   cpumask_t *affinity)
450 {
451 	return acpi_pptt_get_cpumask_from_cache_id(cache_id, affinity);
452 }
453 
454 /*
455  * cpumask_of_node() only knows about online CPUs. This can't tell us whether
456  * a class is represented on all possible CPUs.
457  */
458 static void get_cpumask_from_node_id(u32 node_id, cpumask_t *affinity)
459 {
460 	int cpu;
461 
462 	for_each_possible_cpu(cpu) {
463 		if (node_id == cpu_to_node(cpu))
464 			cpumask_set_cpu(cpu, affinity);
465 	}
466 }
467 
468 static int mpam_ris_get_affinity(struct mpam_msc *msc, cpumask_t *affinity,
469 				 enum mpam_class_types type,
470 				 struct mpam_class *class,
471 				 struct mpam_component *comp)
472 {
473 	int err;
474 
475 	switch (type) {
476 	case MPAM_CLASS_CACHE:
477 		err = mpam_get_cpumask_from_cache_id(comp->comp_id, class->level,
478 						     affinity);
479 		if (err) {
480 			dev_warn_once(&msc->pdev->dev,
481 				      "Failed to determine CPU affinity\n");
482 			return err;
483 		}
484 
485 		if (cpumask_empty(affinity))
486 			dev_warn_once(&msc->pdev->dev, "no CPUs associated with cache node\n");
487 
488 		break;
489 	case MPAM_CLASS_MEMORY:
490 		get_cpumask_from_node_id(comp->comp_id, affinity);
491 		/* affinity may be empty for CPU-less memory nodes */
492 		break;
493 	case MPAM_CLASS_UNKNOWN:
494 		return 0;
495 	}
496 
497 	cpumask_and(affinity, affinity, &msc->accessibility);
498 
499 	return 0;
500 }
501 
502 static int mpam_ris_create_locked(struct mpam_msc *msc, u8 ris_idx,
503 				  enum mpam_class_types type, u8 class_id,
504 				  int component_id)
505 {
506 	int err;
507 	struct mpam_vmsc *vmsc;
508 	struct mpam_msc_ris *ris;
509 	struct mpam_class *class;
510 	struct mpam_component *comp;
511 	struct platform_device *pdev = msc->pdev;
512 
513 	lockdep_assert_held(&mpam_list_lock);
514 
515 	if (ris_idx > MPAM_MSC_MAX_NUM_RIS)
516 		return -EINVAL;
517 
518 	if (test_and_set_bit(ris_idx, &msc->ris_idxs))
519 		return -EBUSY;
520 
521 	ris = devm_kzalloc(&msc->pdev->dev, sizeof(*ris), GFP_KERNEL);
522 	if (!ris)
523 		return -ENOMEM;
524 	init_garbage(&ris->garbage);
525 	ris->garbage.pdev = pdev;
526 
527 	class = mpam_class_find(class_id, type);
528 	if (IS_ERR(class))
529 		return PTR_ERR(class);
530 
531 	comp = mpam_component_find(class, component_id);
532 	if (IS_ERR(comp)) {
533 		if (list_empty(&class->components))
534 			mpam_class_destroy(class);
535 		return PTR_ERR(comp);
536 	}
537 
538 	vmsc = mpam_vmsc_find(comp, msc);
539 	if (IS_ERR(vmsc)) {
540 		if (list_empty(&comp->vmsc))
541 			mpam_component_destroy(comp);
542 		return PTR_ERR(vmsc);
543 	}
544 
545 	err = mpam_ris_get_affinity(msc, &ris->affinity, type, class, comp);
546 	if (err) {
547 		if (list_empty(&vmsc->ris))
548 			mpam_vmsc_destroy(vmsc);
549 		return err;
550 	}
551 
552 	ris->ris_idx = ris_idx;
553 	INIT_LIST_HEAD_RCU(&ris->msc_list);
554 	INIT_LIST_HEAD_RCU(&ris->vmsc_list);
555 	ris->vmsc = vmsc;
556 
557 	cpumask_or(&comp->affinity, &comp->affinity, &ris->affinity);
558 	cpumask_or(&class->affinity, &class->affinity, &ris->affinity);
559 	list_add_rcu(&ris->vmsc_list, &vmsc->ris);
560 	list_add_rcu(&ris->msc_list, &msc->ris);
561 
562 	return 0;
563 }
564 
565 static void mpam_ris_destroy(struct mpam_msc_ris *ris)
566 {
567 	struct mpam_vmsc *vmsc = ris->vmsc;
568 	struct mpam_msc *msc = vmsc->msc;
569 	struct mpam_component *comp = vmsc->comp;
570 	struct mpam_class *class = comp->class;
571 
572 	lockdep_assert_held(&mpam_list_lock);
573 
574 	/*
575 	 * It is assumed affinities don't overlap. If they do the class becomes
576 	 * unusable immediately.
577 	 */
578 	cpumask_andnot(&class->affinity, &class->affinity, &ris->affinity);
579 	cpumask_andnot(&comp->affinity, &comp->affinity, &ris->affinity);
580 	clear_bit(ris->ris_idx, &msc->ris_idxs);
581 	list_del_rcu(&ris->msc_list);
582 	list_del_rcu(&ris->vmsc_list);
583 	add_to_garbage(ris);
584 
585 	if (list_empty(&vmsc->ris))
586 		mpam_vmsc_destroy(vmsc);
587 }
588 
589 int mpam_ris_create(struct mpam_msc *msc, u8 ris_idx,
590 		    enum mpam_class_types type, u8 class_id, int component_id)
591 {
592 	int err;
593 
594 	mutex_lock(&mpam_list_lock);
595 	err = mpam_ris_create_locked(msc, ris_idx, type, class_id,
596 				     component_id);
597 	mutex_unlock(&mpam_list_lock);
598 	if (err)
599 		mpam_free_garbage();
600 
601 	return err;
602 }
603 
604 static struct mpam_msc_ris *mpam_get_or_create_ris(struct mpam_msc *msc,
605 						   u8 ris_idx)
606 {
607 	int err;
608 	struct mpam_msc_ris *ris;
609 
610 	lockdep_assert_held(&mpam_list_lock);
611 
612 	if (!test_bit(ris_idx, &msc->ris_idxs)) {
613 		err = mpam_ris_create_locked(msc, ris_idx, MPAM_CLASS_UNKNOWN,
614 					     0, 0);
615 		if (err)
616 			return ERR_PTR(err);
617 	}
618 
619 	list_for_each_entry(ris, &msc->ris, msc_list) {
620 		if (ris->ris_idx == ris_idx)
621 			return ris;
622 	}
623 
624 	return ERR_PTR(-ENOENT);
625 }
626 
627 /*
628  * IHI009A.a has this nugget: "If a monitor does not support automatic behaviour
629  * of NRDY, software can use this bit for any purpose" - so hardware might not
630  * implement this - but it isn't RES0.
631  *
632  * Try and see what values stick in this bit. If we can write either value,
 633  * it's probably not implemented by hardware.
634  */
635 static bool _mpam_ris_hw_probe_hw_nrdy(struct mpam_msc_ris *ris, u32 mon_reg)
636 {
637 	u32 now;
638 	u64 mon_sel;
639 	bool can_set, can_clear;
640 	struct mpam_msc *msc = ris->vmsc->msc;
641 
642 	if (WARN_ON_ONCE(!mpam_mon_sel_lock(msc)))
643 		return false;
644 
645 	mon_sel = FIELD_PREP(MSMON_CFG_MON_SEL_MON_SEL, 0) |
646 		  FIELD_PREP(MSMON_CFG_MON_SEL_RIS, ris->ris_idx);
647 	_mpam_write_monsel_reg(msc, mon_reg, mon_sel);
648 
649 	_mpam_write_monsel_reg(msc, mon_reg, MSMON___NRDY);
650 	now = _mpam_read_monsel_reg(msc, mon_reg);
651 	can_set = now & MSMON___NRDY;
652 
653 	_mpam_write_monsel_reg(msc, mon_reg, 0);
654 	now = _mpam_read_monsel_reg(msc, mon_reg);
655 	can_clear = !(now & MSMON___NRDY);
656 	mpam_mon_sel_unlock(msc);
657 
658 	return (!can_set || !can_clear);
659 }
660 
661 #define mpam_ris_hw_probe_hw_nrdy(_ris, _mon_reg)			\
662 	_mpam_ris_hw_probe_hw_nrdy(_ris, MSMON_##_mon_reg)
663 
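/*
 * Illustrative summary of the probe above (derived from the code, not part
 * of the original source):
 *
 *	can_set	can_clear	NRDY assumed to be	return value
 *	   1	    1		software-controlled	false
 *	   1	    0		hardware-managed	true
 *	   0	    x		hardware-managed	true
 */
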
664 static void mpam_ris_hw_probe(struct mpam_msc_ris *ris)
665 {
666 	int err;
667 	struct mpam_msc *msc = ris->vmsc->msc;
668 	struct device *dev = &msc->pdev->dev;
669 	struct mpam_props *props = &ris->props;
670 	struct mpam_class *class = ris->vmsc->comp->class;
671 
672 	lockdep_assert_held(&msc->probe_lock);
673 	lockdep_assert_held(&msc->part_sel_lock);
674 
675 	/* Cache Capacity Partitioning */
676 	if (FIELD_GET(MPAMF_IDR_HAS_CCAP_PART, ris->idr)) {
677 		u32 ccap_features = mpam_read_partsel_reg(msc, CCAP_IDR);
678 
679 		props->cmax_wd = FIELD_GET(MPAMF_CCAP_IDR_CMAX_WD, ccap_features);
680 		if (props->cmax_wd &&
681 		    FIELD_GET(MPAMF_CCAP_IDR_HAS_CMAX_SOFTLIM, ccap_features))
682 			mpam_set_feature(mpam_feat_cmax_softlim, props);
683 
684 		if (props->cmax_wd &&
685 		    !FIELD_GET(MPAMF_CCAP_IDR_NO_CMAX, ccap_features))
686 			mpam_set_feature(mpam_feat_cmax_cmax, props);
687 
688 		if (props->cmax_wd &&
689 		    FIELD_GET(MPAMF_CCAP_IDR_HAS_CMIN, ccap_features))
690 			mpam_set_feature(mpam_feat_cmax_cmin, props);
691 
692 		props->cassoc_wd = FIELD_GET(MPAMF_CCAP_IDR_CASSOC_WD, ccap_features);
693 		if (props->cassoc_wd &&
694 		    FIELD_GET(MPAMF_CCAP_IDR_HAS_CASSOC, ccap_features))
695 			mpam_set_feature(mpam_feat_cmax_cassoc, props);
696 	}
697 
698 	/* Cache Portion partitioning */
699 	if (FIELD_GET(MPAMF_IDR_HAS_CPOR_PART, ris->idr)) {
700 		u32 cpor_features = mpam_read_partsel_reg(msc, CPOR_IDR);
701 
702 		props->cpbm_wd = FIELD_GET(MPAMF_CPOR_IDR_CPBM_WD, cpor_features);
703 		if (props->cpbm_wd)
704 			mpam_set_feature(mpam_feat_cpor_part, props);
705 	}
706 
707 	/* Memory bandwidth partitioning */
708 	if (FIELD_GET(MPAMF_IDR_HAS_MBW_PART, ris->idr)) {
709 		u32 mbw_features = mpam_read_partsel_reg(msc, MBW_IDR);
710 
711 		/* portion bitmap resolution */
712 		props->mbw_pbm_bits = FIELD_GET(MPAMF_MBW_IDR_BWPBM_WD, mbw_features);
713 		if (props->mbw_pbm_bits &&
714 		    FIELD_GET(MPAMF_MBW_IDR_HAS_PBM, mbw_features))
715 			mpam_set_feature(mpam_feat_mbw_part, props);
716 
717 		props->bwa_wd = FIELD_GET(MPAMF_MBW_IDR_BWA_WD, mbw_features);
718 		if (props->bwa_wd && FIELD_GET(MPAMF_MBW_IDR_HAS_MAX, mbw_features))
719 			mpam_set_feature(mpam_feat_mbw_max, props);
720 
721 		if (props->bwa_wd && FIELD_GET(MPAMF_MBW_IDR_HAS_MIN, mbw_features))
722 			mpam_set_feature(mpam_feat_mbw_min, props);
723 
724 		if (props->bwa_wd && FIELD_GET(MPAMF_MBW_IDR_HAS_PROP, mbw_features))
725 			mpam_set_feature(mpam_feat_mbw_prop, props);
726 	}
727 
728 	/* Priority partitioning */
729 	if (FIELD_GET(MPAMF_IDR_HAS_PRI_PART, ris->idr)) {
730 		u32 pri_features = mpam_read_partsel_reg(msc, PRI_IDR);
731 
732 		props->intpri_wd = FIELD_GET(MPAMF_PRI_IDR_INTPRI_WD, pri_features);
733 		if (props->intpri_wd && FIELD_GET(MPAMF_PRI_IDR_HAS_INTPRI, pri_features)) {
734 			mpam_set_feature(mpam_feat_intpri_part, props);
735 			if (FIELD_GET(MPAMF_PRI_IDR_INTPRI_0_IS_LOW, pri_features))
736 				mpam_set_feature(mpam_feat_intpri_part_0_low, props);
737 		}
738 
739 		props->dspri_wd = FIELD_GET(MPAMF_PRI_IDR_DSPRI_WD, pri_features);
740 		if (props->dspri_wd && FIELD_GET(MPAMF_PRI_IDR_HAS_DSPRI, pri_features)) {
741 			mpam_set_feature(mpam_feat_dspri_part, props);
742 			if (FIELD_GET(MPAMF_PRI_IDR_DSPRI_0_IS_LOW, pri_features))
743 				mpam_set_feature(mpam_feat_dspri_part_0_low, props);
744 		}
745 	}
746 
747 	/* Performance Monitoring */
748 	if (FIELD_GET(MPAMF_IDR_HAS_MSMON, ris->idr)) {
749 		u32 msmon_features = mpam_read_partsel_reg(msc, MSMON_IDR);
750 
751 		/*
752 		 * If the firmware max-nrdy-us property is missing, the
753 		 * CSU counters can't be used. Should we wait forever?
754 		 */
755 		err = device_property_read_u32(&msc->pdev->dev,
756 					       "arm,not-ready-us",
757 					       &msc->nrdy_usec);
758 
759 		if (FIELD_GET(MPAMF_MSMON_IDR_MSMON_CSU, msmon_features)) {
760 			u32 csumonidr;
761 
762 			csumonidr = mpam_read_partsel_reg(msc, CSUMON_IDR);
763 			props->num_csu_mon = FIELD_GET(MPAMF_CSUMON_IDR_NUM_MON, csumonidr);
764 			if (props->num_csu_mon) {
765 				bool hw_managed;
766 
767 				mpam_set_feature(mpam_feat_msmon_csu, props);
768 
769 				if (FIELD_GET(MPAMF_CSUMON_IDR_HAS_XCL, csumonidr))
770 					mpam_set_feature(mpam_feat_msmon_csu_xcl, props);
771 
772 				/* Is NRDY hardware managed? */
773 				hw_managed = mpam_ris_hw_probe_hw_nrdy(ris, CSU);
774 				if (hw_managed)
775 					mpam_set_feature(mpam_feat_msmon_csu_hw_nrdy, props);
776 			}
777 
778 			/*
779 			 * Accept the missing firmware property if NRDY appears
780 			 * un-implemented.
781 			 */
782 			if (err && mpam_has_feature(mpam_feat_msmon_csu_hw_nrdy, props))
783 				dev_err_once(dev, "Counters are not usable because not-ready timeout was not provided by firmware.");
784 		}
785 		if (FIELD_GET(MPAMF_MSMON_IDR_MSMON_MBWU, msmon_features)) {
786 			bool has_long, hw_managed;
787 			u32 mbwumon_idr = mpam_read_partsel_reg(msc, MBWUMON_IDR);
788 
789 			props->num_mbwu_mon = FIELD_GET(MPAMF_MBWUMON_IDR_NUM_MON, mbwumon_idr);
790 			if (props->num_mbwu_mon) {
791 				mpam_set_feature(mpam_feat_msmon_mbwu, props);
792 
793 				if (FIELD_GET(MPAMF_MBWUMON_IDR_HAS_RWBW, mbwumon_idr))
794 					mpam_set_feature(mpam_feat_msmon_mbwu_rwbw, props);
795 
796 				has_long = FIELD_GET(MPAMF_MBWUMON_IDR_HAS_LONG, mbwumon_idr);
797 				if (has_long) {
798 					if (FIELD_GET(MPAMF_MBWUMON_IDR_LWD, mbwumon_idr))
799 						mpam_set_feature(mpam_feat_msmon_mbwu_63counter, props);
800 					else
801 						mpam_set_feature(mpam_feat_msmon_mbwu_44counter, props);
802 				} else {
803 					mpam_set_feature(mpam_feat_msmon_mbwu_31counter, props);
804 				}
805 
806 				/* Is NRDY hardware managed? */
807 				hw_managed = mpam_ris_hw_probe_hw_nrdy(ris, MBWU);
808 				if (hw_managed)
809 					mpam_set_feature(mpam_feat_msmon_mbwu_hw_nrdy, props);
810 
811 				/*
812 				 * Don't warn about any missing firmware property for
813 				 * MBWU NRDY - it doesn't make any sense!
814 				 */
815 			}
816 		}
817 	}
818 
819 	/*
820 	 * RIS with PARTID narrowing don't have enough storage for one
821 	 * configuration per PARTID. If these are in a class we could use,
822 	 * reduce the supported partid_max to match the number of intpartid.
823 	 * If the class is unknown, just ignore it.
824 	 */
825 	if (FIELD_GET(MPAMF_IDR_HAS_PARTID_NRW, ris->idr) &&
826 	    class->type != MPAM_CLASS_UNKNOWN) {
827 		u32 nrwidr = mpam_read_partsel_reg(msc, PARTID_NRW_IDR);
828 		u16 partid_max = FIELD_GET(MPAMF_PARTID_NRW_IDR_INTPARTID_MAX, nrwidr);
829 
830 		mpam_set_feature(mpam_feat_partid_nrw, props);
831 		msc->partid_max = min(msc->partid_max, partid_max);
832 	}
833 }
834 
835 static int mpam_msc_hw_probe(struct mpam_msc *msc)
836 {
837 	u64 idr;
838 	u16 partid_max;
839 	u8 ris_idx, pmg_max;
840 	struct mpam_msc_ris *ris;
841 	struct device *dev = &msc->pdev->dev;
842 
843 	lockdep_assert_held(&msc->probe_lock);
844 
845 	idr = __mpam_read_reg(msc, MPAMF_AIDR);
846 	if ((idr & MPAMF_AIDR_ARCH_MAJOR_REV) != MPAM_ARCHITECTURE_V1) {
847 		dev_err_once(dev, "MSC does not match MPAM architecture v1.x\n");
848 		return -EIO;
849 	}
850 
851 	/* Grab an IDR value to find out how many RIS there are */
852 	mutex_lock(&msc->part_sel_lock);
853 	idr = mpam_msc_read_idr(msc);
854 	mutex_unlock(&msc->part_sel_lock);
855 
856 	msc->ris_max = FIELD_GET(MPAMF_IDR_RIS_MAX, idr);
857 
858 	/* Use these values so partid/pmg always starts with a valid value */
859 	msc->partid_max = FIELD_GET(MPAMF_IDR_PARTID_MAX, idr);
860 	msc->pmg_max = FIELD_GET(MPAMF_IDR_PMG_MAX, idr);
861 
862 	for (ris_idx = 0; ris_idx <= msc->ris_max; ris_idx++) {
863 		mutex_lock(&msc->part_sel_lock);
864 		__mpam_part_sel(ris_idx, 0, msc);
865 		idr = mpam_msc_read_idr(msc);
866 		mutex_unlock(&msc->part_sel_lock);
867 
868 		partid_max = FIELD_GET(MPAMF_IDR_PARTID_MAX, idr);
869 		pmg_max = FIELD_GET(MPAMF_IDR_PMG_MAX, idr);
870 		msc->partid_max = min(msc->partid_max, partid_max);
871 		msc->pmg_max = min(msc->pmg_max, pmg_max);
872 		msc->has_extd_esr = FIELD_GET(MPAMF_IDR_HAS_EXTD_ESR, idr);
873 
874 		mutex_lock(&mpam_list_lock);
875 		ris = mpam_get_or_create_ris(msc, ris_idx);
876 		mutex_unlock(&mpam_list_lock);
877 		if (IS_ERR(ris))
878 			return PTR_ERR(ris);
879 		ris->idr = idr;
880 
881 		mutex_lock(&msc->part_sel_lock);
882 		__mpam_part_sel(ris_idx, 0, msc);
883 		mpam_ris_hw_probe(ris);
884 		mutex_unlock(&msc->part_sel_lock);
885 	}
886 
887 	/* Clear any stale errors */
888 	mpam_msc_clear_esr(msc);
889 
890 	spin_lock(&partid_max_lock);
891 	mpam_partid_max = min(mpam_partid_max, msc->partid_max);
892 	mpam_pmg_max = min(mpam_pmg_max, msc->pmg_max);
893 	spin_unlock(&partid_max_lock);
894 
895 	msc->probed = true;
896 
897 	return 0;
898 }
899 
900 struct mon_read {
901 	struct mpam_msc_ris		*ris;
902 	struct mon_cfg			*ctx;
903 	enum mpam_device_features	type;
904 	u64				*val;
905 	int				err;
906 };
907 
908 static bool mpam_ris_has_mbwu_long_counter(struct mpam_msc_ris *ris)
909 {
910 	return (mpam_has_feature(mpam_feat_msmon_mbwu_63counter, &ris->props) ||
911 		mpam_has_feature(mpam_feat_msmon_mbwu_44counter, &ris->props));
912 }
913 
914 static u64 mpam_msc_read_mbwu_l(struct mpam_msc *msc)
915 {
916 	int retry = 3;
917 	u32 mbwu_l_low;
918 	u64 mbwu_l_high1, mbwu_l_high2;
919 
920 	mpam_mon_sel_lock_held(msc);
921 
922 	WARN_ON_ONCE((MSMON_MBWU_L + sizeof(u64)) > msc->mapped_hwpage_sz);
923 	WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(), &msc->accessibility));
924 
925 	mbwu_l_high2 = __mpam_read_reg(msc, MSMON_MBWU_L + 4);
926 	do {
927 		mbwu_l_high1 = mbwu_l_high2;
928 		mbwu_l_low = __mpam_read_reg(msc, MSMON_MBWU_L);
929 		mbwu_l_high2 = __mpam_read_reg(msc, MSMON_MBWU_L + 4);
930 
931 		retry--;
932 	} while (mbwu_l_high1 != mbwu_l_high2 && retry > 0);
933 
934 	if (mbwu_l_high1 == mbwu_l_high2)
935 		return (mbwu_l_high1 << 32) | mbwu_l_low;
936 
937 	pr_warn("Failed to read a stable value\n");
938 	return MSMON___L_NRDY;
939 }
940 
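/*
 * Worked example (illustrative): if the long counter increments from
 * 0x1_ffff_ffff to 0x2_0000_0000 between the two 32-bit accesses, the two
 * reads of the high word above disagree (0x1 vs 0x2) and the loop retries,
 * so a torn result mixing the old high word with the new low word (or vice
 * versa) is never returned.
 */
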
941 static void mpam_msc_zero_mbwu_l(struct mpam_msc *msc)
942 {
943 	mpam_mon_sel_lock_held(msc);
944 
945 	WARN_ON_ONCE((MSMON_MBWU_L + sizeof(u64)) > msc->mapped_hwpage_sz);
946 	WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(), &msc->accessibility));
947 
948 	__mpam_write_reg(msc, MSMON_MBWU_L, 0);
949 	__mpam_write_reg(msc, MSMON_MBWU_L + 4, 0);
950 }
951 
952 static void gen_msmon_ctl_flt_vals(struct mon_read *m, u32 *ctl_val,
953 				   u32 *flt_val)
954 {
955 	struct mon_cfg *ctx = m->ctx;
956 
957 	/*
958 	 * For CSU counters it's implementation-defined what happens when not
959 	 * filtering by partid.
960 	 */
961 	*ctl_val = MSMON_CFG_x_CTL_MATCH_PARTID;
962 
963 	*flt_val = FIELD_PREP(MSMON_CFG_x_FLT_PARTID, ctx->partid);
964 
965 	if (m->ctx->match_pmg) {
966 		*ctl_val |= MSMON_CFG_x_CTL_MATCH_PMG;
967 		*flt_val |= FIELD_PREP(MSMON_CFG_x_FLT_PMG, ctx->pmg);
968 	}
969 
970 	switch (m->type) {
971 	case mpam_feat_msmon_csu:
972 		*ctl_val |= MSMON_CFG_CSU_CTL_TYPE_CSU;
973 
974 		if (mpam_has_feature(mpam_feat_msmon_csu_xcl, &m->ris->props))
975 			*flt_val |= FIELD_PREP(MSMON_CFG_CSU_FLT_XCL, ctx->csu_exclude_clean);
976 
977 		break;
978 	case mpam_feat_msmon_mbwu_31counter:
979 	case mpam_feat_msmon_mbwu_44counter:
980 	case mpam_feat_msmon_mbwu_63counter:
981 		*ctl_val |= MSMON_CFG_MBWU_CTL_TYPE_MBWU;
982 
983 		if (mpam_has_feature(mpam_feat_msmon_mbwu_rwbw, &m->ris->props))
984 			*flt_val |= FIELD_PREP(MSMON_CFG_MBWU_FLT_RWBW, ctx->opts);
985 
986 		break;
987 	default:
988 		pr_warn("Unexpected monitor type %d\n", m->type);
989 	}
990 }
991 
992 static void read_msmon_ctl_flt_vals(struct mon_read *m, u32 *ctl_val,
993 				    u32 *flt_val)
994 {
995 	struct mpam_msc *msc = m->ris->vmsc->msc;
996 
997 	switch (m->type) {
998 	case mpam_feat_msmon_csu:
999 		*ctl_val = mpam_read_monsel_reg(msc, CFG_CSU_CTL);
1000 		*flt_val = mpam_read_monsel_reg(msc, CFG_CSU_FLT);
1001 		break;
1002 	case mpam_feat_msmon_mbwu_31counter:
1003 	case mpam_feat_msmon_mbwu_44counter:
1004 	case mpam_feat_msmon_mbwu_63counter:
1005 		*ctl_val = mpam_read_monsel_reg(msc, CFG_MBWU_CTL);
1006 		*flt_val = mpam_read_monsel_reg(msc, CFG_MBWU_FLT);
1007 		break;
1008 	default:
1009 		pr_warn("Unexpected monitor type %d\n", m->type);
1010 	}
1011 }
1012 
1013 /* Remove values set by the hardware to prevent apparent mismatches. */
1014 static inline void clean_msmon_ctl_val(u32 *cur_ctl)
1015 {
1016 	*cur_ctl &= ~MSMON_CFG_x_CTL_OFLOW_STATUS;
1017 
1018 	if (FIELD_GET(MSMON_CFG_x_CTL_TYPE, *cur_ctl) == MSMON_CFG_MBWU_CTL_TYPE_MBWU)
1019 		*cur_ctl &= ~MSMON_CFG_MBWU_CTL_OFLOW_STATUS_L;
1020 }
1021 
1022 static void write_msmon_ctl_flt_vals(struct mon_read *m, u32 ctl_val,
1023 				     u32 flt_val)
1024 {
1025 	struct mpam_msc *msc = m->ris->vmsc->msc;
1026 
1027 	/*
1028 	 * Write the ctl_val with the enable bit cleared, reset the counter,
1029 	 * then enable the counter.
1030 	 */
1031 	switch (m->type) {
1032 	case mpam_feat_msmon_csu:
1033 		mpam_write_monsel_reg(msc, CFG_CSU_FLT, flt_val);
1034 		mpam_write_monsel_reg(msc, CFG_CSU_CTL, ctl_val);
1035 		mpam_write_monsel_reg(msc, CSU, 0);
1036 		mpam_write_monsel_reg(msc, CFG_CSU_CTL, ctl_val | MSMON_CFG_x_CTL_EN);
1037 		break;
1038 	case mpam_feat_msmon_mbwu_31counter:
1039 	case mpam_feat_msmon_mbwu_44counter:
1040 	case mpam_feat_msmon_mbwu_63counter:
1041 		mpam_write_monsel_reg(msc, CFG_MBWU_FLT, flt_val);
1042 		mpam_write_monsel_reg(msc, CFG_MBWU_CTL, ctl_val);
1043 		mpam_write_monsel_reg(msc, CFG_MBWU_CTL, ctl_val | MSMON_CFG_x_CTL_EN);
1044 		/* Counting monitors require NRDY to be reset by software */
1045 		if (m->type == mpam_feat_msmon_mbwu_31counter)
1046 			mpam_write_monsel_reg(msc, MBWU, 0);
1047 		else
1048 			mpam_msc_zero_mbwu_l(m->ris->vmsc->msc);
1049 		break;
1050 	default:
1051 		pr_warn("Unexpected monitor type %d\n", m->type);
1052 	}
1053 }
1054 
1055 static u64 mpam_msmon_overflow_val(enum mpam_device_features type)
1056 {
1057 	/* TODO: implement scaling counters */
1058 	switch (type) {
1059 	case mpam_feat_msmon_mbwu_63counter:
1060 		return BIT_ULL(hweight_long(MSMON___LWD_VALUE));
1061 	case mpam_feat_msmon_mbwu_44counter:
1062 		return BIT_ULL(hweight_long(MSMON___L_VALUE));
1063 	case mpam_feat_msmon_mbwu_31counter:
1064 		return BIT_ULL(hweight_long(MSMON___VALUE));
1065 	default:
1066 		return 0;
1067 	}
1068 }
1069 
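/*
 * Worked example (illustrative, assuming MSMON___VALUE is the 31-bit field
 * [30:0] with NRDY in bit 31): hweight_long() gives 31, so each overflow of
 * a 31-bit counter adds BIT_ULL(31) to mbwu_state->correction. The 44-bit
 * and 63-bit long counters contribute 2^44 and 2^63 per overflow in the
 * same way.
 */
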
1070 static void __ris_msmon_read(void *arg)
1071 {
1072 	u64 now;
1073 	bool nrdy = false;
1074 	bool config_mismatch;
1075 	bool overflow = false;
1076 	struct mon_read *m = arg;
1077 	struct mon_cfg *ctx = m->ctx;
1078 	bool reset_on_next_read = false;
1079 	struct mpam_msc_ris *ris = m->ris;
1080 	struct msmon_mbwu_state *mbwu_state;
1081 	struct mpam_props *rprops = &ris->props;
1082 	struct mpam_msc *msc = m->ris->vmsc->msc;
1083 	u32 mon_sel, ctl_val, flt_val, cur_ctl, cur_flt;
1084 
1085 	if (!mpam_mon_sel_lock(msc)) {
1086 		m->err = -EIO;
1087 		return;
1088 	}
1089 	mon_sel = FIELD_PREP(MSMON_CFG_MON_SEL_MON_SEL, ctx->mon) |
1090 		  FIELD_PREP(MSMON_CFG_MON_SEL_RIS, ris->ris_idx);
1091 	mpam_write_monsel_reg(msc, CFG_MON_SEL, mon_sel);
1092 
1093 	switch (m->type) {
1094 	case mpam_feat_msmon_mbwu_31counter:
1095 	case mpam_feat_msmon_mbwu_44counter:
1096 	case mpam_feat_msmon_mbwu_63counter:
1097 		mbwu_state = &ris->mbwu_state[ctx->mon];
1098 		if (mbwu_state) {
1099 			reset_on_next_read = mbwu_state->reset_on_next_read;
1100 			mbwu_state->reset_on_next_read = false;
1101 		}
1102 		break;
1103 	default:
1104 		break;
1105 	}
1106 
1107 	/*
1108 	 * Read the existing configuration to avoid re-writing the same values.
1109 	 * This saves waiting for 'nrdy' on subsequent reads.
1110 	 */
1111 	read_msmon_ctl_flt_vals(m, &cur_ctl, &cur_flt);
1112 
1113 	if (mpam_feat_msmon_mbwu_31counter == m->type)
1114 		overflow = cur_ctl & MSMON_CFG_x_CTL_OFLOW_STATUS;
1115 	else if (mpam_feat_msmon_mbwu_44counter == m->type ||
1116 		 mpam_feat_msmon_mbwu_63counter == m->type)
1117 		overflow = cur_ctl & MSMON_CFG_MBWU_CTL_OFLOW_STATUS_L;
1118 
1119 	clean_msmon_ctl_val(&cur_ctl);
1120 	gen_msmon_ctl_flt_vals(m, &ctl_val, &flt_val);
1121 	config_mismatch = cur_flt != flt_val ||
1122 			  cur_ctl != (ctl_val | MSMON_CFG_x_CTL_EN);
1123 
1124 	if (config_mismatch || reset_on_next_read) {
1125 		write_msmon_ctl_flt_vals(m, ctl_val, flt_val);
1126 		overflow = false;
1127 	} else if (overflow) {
1128 		mpam_write_monsel_reg(msc, CFG_MBWU_CTL,
1129 				      cur_ctl &
1130 				      ~(MSMON_CFG_x_CTL_OFLOW_STATUS |
1131 					MSMON_CFG_MBWU_CTL_OFLOW_STATUS_L));
1132 	}
1133 
1134 	switch (m->type) {
1135 	case mpam_feat_msmon_csu:
1136 		now = mpam_read_monsel_reg(msc, CSU);
1137 		if (mpam_has_feature(mpam_feat_msmon_csu_hw_nrdy, rprops))
1138 			nrdy = now & MSMON___NRDY;
1139 		now = FIELD_GET(MSMON___VALUE, now);
1140 		break;
1141 	case mpam_feat_msmon_mbwu_31counter:
1142 	case mpam_feat_msmon_mbwu_44counter:
1143 	case mpam_feat_msmon_mbwu_63counter:
1144 		if (m->type != mpam_feat_msmon_mbwu_31counter) {
1145 			now = mpam_msc_read_mbwu_l(msc);
1146 			if (mpam_has_feature(mpam_feat_msmon_mbwu_hw_nrdy, rprops))
1147 				nrdy = now & MSMON___L_NRDY;
1148 
1149 			if (m->type == mpam_feat_msmon_mbwu_63counter)
1150 				now = FIELD_GET(MSMON___LWD_VALUE, now);
1151 			else
1152 				now = FIELD_GET(MSMON___L_VALUE, now);
1153 		} else {
1154 			now = mpam_read_monsel_reg(msc, MBWU);
1155 			if (mpam_has_feature(mpam_feat_msmon_mbwu_hw_nrdy, rprops))
1156 				nrdy = now & MSMON___NRDY;
1157 			now = FIELD_GET(MSMON___VALUE, now);
1158 		}
1159 
1160 		if (nrdy)
1161 			break;
1162 
1163 		mbwu_state = &ris->mbwu_state[ctx->mon];
1164 
1165 		if (overflow)
1166 			mbwu_state->correction += mpam_msmon_overflow_val(m->type);
1167 
1168 		/*
1169 		 * Include bandwidth consumed before the last hardware reset and
1170 		 * a counter size increment for each overflow.
1171 		 */
1172 		now += mbwu_state->correction;
1173 		break;
1174 	default:
1175 		m->err = -EINVAL;
1176 	}
1177 	mpam_mon_sel_unlock(msc);
1178 
1179 	if (nrdy)
1180 		m->err = -EBUSY;
1181 
1182 	if (m->err)
1183 		return;
1184 
1185 	*m->val += now;
1186 }
1187 
1188 static int _msmon_read(struct mpam_component *comp, struct mon_read *arg)
1189 {
1190 	int err, any_err = 0;
1191 	struct mpam_vmsc *vmsc;
1192 
1193 	guard(srcu)(&mpam_srcu);
1194 	list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
1195 				 srcu_read_lock_held(&mpam_srcu)) {
1196 		struct mpam_msc *msc = vmsc->msc;
1197 		struct mpam_msc_ris *ris;
1198 
1199 		list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
1200 					 srcu_read_lock_held(&mpam_srcu)) {
1201 			arg->ris = ris;
1202 
1203 			err = smp_call_function_any(&msc->accessibility,
1204 						    __ris_msmon_read, arg,
1205 						    true);
1206 			if (!err && arg->err)
1207 				err = arg->err;
1208 
1209 			/*
1210 			 * Save one error to be returned to the caller, but
1211 			 * keep reading counters so that they get reprogrammed. On
1212 			 * platforms with NRDY this lets us wait once.
1213 			 */
1214 			if (err)
1215 				any_err = err;
1216 		}
1217 	}
1218 
1219 	return any_err;
1220 }
1221 
1222 static enum mpam_device_features mpam_msmon_choose_counter(struct mpam_class *class)
1223 {
1224 	struct mpam_props *cprops = &class->props;
1225 
1226 	if (mpam_has_feature(mpam_feat_msmon_mbwu_63counter, cprops))
1227 		return mpam_feat_msmon_mbwu_63counter;
1228 	if (mpam_has_feature(mpam_feat_msmon_mbwu_44counter, cprops))
1229 		return mpam_feat_msmon_mbwu_44counter;
1230 
1231 	return mpam_feat_msmon_mbwu_31counter;
1232 }
1233 
1234 int mpam_msmon_read(struct mpam_component *comp, struct mon_cfg *ctx,
1235 		    enum mpam_device_features type, u64 *val)
1236 {
1237 	int err;
1238 	struct mon_read arg;
1239 	u64 wait_jiffies = 0;
1240 	struct mpam_class *class = comp->class;
1241 	struct mpam_props *cprops = &class->props;
1242 
1243 	might_sleep();
1244 
1245 	if (!mpam_is_enabled())
1246 		return -EIO;
1247 
1248 	if (!mpam_has_feature(type, cprops))
1249 		return -EOPNOTSUPP;
1250 
1251 	if (type == mpam_feat_msmon_mbwu)
1252 		type = mpam_msmon_choose_counter(class);
1253 
1254 	arg = (struct mon_read) {
1255 		.ctx = ctx,
1256 		.type = type,
1257 		.val = val,
1258 	};
1259 	*val = 0;
1260 
1261 	err = _msmon_read(comp, &arg);
1262 	if (err == -EBUSY && class->nrdy_usec)
1263 		wait_jiffies = usecs_to_jiffies(class->nrdy_usec);
1264 
1265 	while (wait_jiffies)
1266 		wait_jiffies = schedule_timeout_uninterruptible(wait_jiffies);
1267 
1268 	if (err == -EBUSY) {
1269 		arg = (struct mon_read) {
1270 			.ctx = ctx,
1271 			.type = type,
1272 			.val = val,
1273 		};
1274 		*val = 0;
1275 
1276 		err = _msmon_read(comp, &arg);
1277 	}
1278 
1279 	return err;
1280 }
1281 
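/*
 * Example caller (an illustrative sketch, not from the original file): a
 * monitor read selects the counter by PARTID/PMG and accumulates the value
 * across every RIS in the component:
 *
 *	struct mon_cfg cfg = {
 *		.mon		= allocated_monitor_index,	// hypothetical
 *		.partid		= partid,
 *		.pmg		= pmg,
 *		.match_pmg	= true,
 *	};
 *	u64 val;
 *	int err = mpam_msmon_read(comp, &cfg, mpam_feat_msmon_mbwu, &val);
 *
 * mpam_feat_msmon_mbwu is translated to the widest counter the class
 * supports by mpam_msmon_choose_counter().
 */
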
1282 void mpam_msmon_reset_mbwu(struct mpam_component *comp, struct mon_cfg *ctx)
1283 {
1284 	struct mpam_msc *msc;
1285 	struct mpam_vmsc *vmsc;
1286 	struct mpam_msc_ris *ris;
1287 
1288 	if (!mpam_is_enabled())
1289 		return;
1290 
1291 	guard(srcu)(&mpam_srcu);
1292 	list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
1293 				 srcu_read_lock_held(&mpam_srcu)) {
1294 		if (!mpam_has_feature(mpam_feat_msmon_mbwu, &vmsc->props))
1295 			continue;
1296 
1297 		msc = vmsc->msc;
1298 		list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
1299 					 srcu_read_lock_held(&mpam_srcu)) {
1300 			if (!mpam_has_feature(mpam_feat_msmon_mbwu, &ris->props))
1301 				continue;
1302 
1303 			if (WARN_ON_ONCE(!mpam_mon_sel_lock(msc)))
1304 				continue;
1305 
1306 			ris->mbwu_state[ctx->mon].correction = 0;
1307 			ris->mbwu_state[ctx->mon].reset_on_next_read = true;
1308 			mpam_mon_sel_unlock(msc);
1309 		}
1310 	}
1311 }
1312 
1313 static void mpam_reset_msc_bitmap(struct mpam_msc *msc, u16 reg, u16 wd)
1314 {
1315 	u32 num_words, msb;
1316 	u32 bm = ~0;
1317 	int i;
1318 
1319 	lockdep_assert_held(&msc->part_sel_lock);
1320 
1321 	if (wd == 0)
1322 		return;
1323 
1324 	/*
1325 	 * Write ~0 to all but the last 32-bit word, which may
1326 	 * have fewer bits...
1327 	 */
1328 	num_words = DIV_ROUND_UP(wd, 32);
1329 	for (i = 0; i < num_words - 1; i++, reg += sizeof(bm))
1330 		__mpam_write_reg(msc, reg, bm);
1331 
1332 	/*
1333 	 * ...and then the last (maybe partial) 32-bit word. When wd is a
1334 	 * multiple of 32, msb should be 31 to write a full 32-bit word.
1335 	 */
1336 	msb = (wd - 1) % 32;
1337 	bm = GENMASK(msb, 0);
1338 	__mpam_write_reg(msc, reg, bm);
1339 }
1340 
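/*
 * Worked example (illustrative): with wd = 40, num_words = 2; the first
 * 32-bit word is written with ~0, then msb = (40 - 1) % 32 = 7 and the
 * second word is written with GENMASK(7, 0), setting only the remaining
 * 8 portion bits.
 */
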
1341 /* Called via IPI. Call while holding an SRCU reference */
1342 static void mpam_reprogram_ris_partid(struct mpam_msc_ris *ris, u16 partid,
1343 				      struct mpam_config *cfg)
1344 {
1345 	u32 pri_val = 0;
1346 	u16 cmax = MPAMCFG_CMAX_CMAX;
1347 	struct mpam_msc *msc = ris->vmsc->msc;
1348 	struct mpam_props *rprops = &ris->props;
1349 	u16 dspri = GENMASK(rprops->dspri_wd, 0);
1350 	u16 intpri = GENMASK(rprops->intpri_wd, 0);
1351 
1352 	mutex_lock(&msc->part_sel_lock);
1353 	__mpam_part_sel(ris->ris_idx, partid, msc);
1354 
1355 	if (mpam_has_feature(mpam_feat_partid_nrw, rprops)) {
1356 		/* Update the intpartid mapping */
1357 		mpam_write_partsel_reg(msc, INTPARTID,
1358 				       MPAMCFG_INTPARTID_INTERNAL | partid);
1359 
1360 		/*
1361 		 * Then switch to the 'internal' partid to update the
1362 		 * configuration.
1363 		 */
1364 		__mpam_intpart_sel(ris->ris_idx, partid, msc);
1365 	}
1366 
1367 	if (mpam_has_feature(mpam_feat_cpor_part, rprops) &&
1368 	    mpam_has_feature(mpam_feat_cpor_part, cfg)) {
1369 		if (cfg->reset_cpbm)
1370 			mpam_reset_msc_bitmap(msc, MPAMCFG_CPBM, rprops->cpbm_wd);
1371 		else
1372 			mpam_write_partsel_reg(msc, CPBM, cfg->cpbm);
1373 	}
1374 
1375 	if (mpam_has_feature(mpam_feat_mbw_part, rprops) &&
1376 	    mpam_has_feature(mpam_feat_mbw_part, cfg)) {
1377 		if (cfg->reset_mbw_pbm)
1378 			mpam_reset_msc_bitmap(msc, MPAMCFG_MBW_PBM, rprops->mbw_pbm_bits);
1379 		else
1380 			mpam_write_partsel_reg(msc, MBW_PBM, cfg->mbw_pbm);
1381 	}
1382 
1383 	if (mpam_has_feature(mpam_feat_mbw_min, rprops) &&
1384 	    mpam_has_feature(mpam_feat_mbw_min, cfg))
1385 		mpam_write_partsel_reg(msc, MBW_MIN, 0);
1386 
1387 	if (mpam_has_feature(mpam_feat_mbw_max, rprops) &&
1388 	    mpam_has_feature(mpam_feat_mbw_max, cfg)) {
1389 		if (cfg->reset_mbw_max)
1390 			mpam_write_partsel_reg(msc, MBW_MAX, MPAMCFG_MBW_MAX_MAX);
1391 		else
1392 			mpam_write_partsel_reg(msc, MBW_MAX, cfg->mbw_max);
1393 	}
1394 
1395 	if (mpam_has_feature(mpam_feat_mbw_prop, rprops) &&
1396 	    mpam_has_feature(mpam_feat_mbw_prop, cfg))
1397 		mpam_write_partsel_reg(msc, MBW_PROP, 0);
1398 
1399 	if (mpam_has_feature(mpam_feat_cmax_cmax, rprops))
1400 		mpam_write_partsel_reg(msc, CMAX, cmax);
1401 
1402 	if (mpam_has_feature(mpam_feat_cmax_cmin, rprops))
1403 		mpam_write_partsel_reg(msc, CMIN, 0);
1404 
1405 	if (mpam_has_feature(mpam_feat_cmax_cassoc, rprops))
1406 		mpam_write_partsel_reg(msc, CASSOC, MPAMCFG_CASSOC_CASSOC);
1407 
1408 	if (mpam_has_feature(mpam_feat_intpri_part, rprops) ||
1409 	    mpam_has_feature(mpam_feat_dspri_part, rprops)) {
1410 		/* aces high? */
1411 		if (!mpam_has_feature(mpam_feat_intpri_part_0_low, rprops))
1412 			intpri = 0;
1413 		if (!mpam_has_feature(mpam_feat_dspri_part_0_low, rprops))
1414 			dspri = 0;
1415 
1416 		if (mpam_has_feature(mpam_feat_intpri_part, rprops))
1417 			pri_val |= FIELD_PREP(MPAMCFG_PRI_INTPRI, intpri);
1418 		if (mpam_has_feature(mpam_feat_dspri_part, rprops))
1419 			pri_val |= FIELD_PREP(MPAMCFG_PRI_DSPRI, dspri);
1420 
1421 		mpam_write_partsel_reg(msc, PRI, pri_val);
1422 	}
1423 
1424 	mutex_unlock(&msc->part_sel_lock);
1425 }
1426 
1427 /* Call with msc cfg_lock held */
1428 static int mpam_restore_mbwu_state(void *_ris)
1429 {
1430 	int i;
1431 	struct mon_read mwbu_arg;
1432 	struct mpam_msc_ris *ris = _ris;
1433 	struct mpam_class *class = ris->vmsc->comp->class;
1434 
1435 	for (i = 0; i < ris->props.num_mbwu_mon; i++) {
1436 		if (ris->mbwu_state[i].enabled) {
1437 			mwbu_arg.ris = ris;
1438 			mwbu_arg.ctx = &ris->mbwu_state[i].cfg;
1439 			mwbu_arg.type = mpam_msmon_choose_counter(class);
1440 
1441 			__ris_msmon_read(&mwbu_arg);
1442 		}
1443 	}
1444 
1445 	return 0;
1446 }
1447 
1448 /* Call with MSC cfg_lock held */
1449 static int mpam_save_mbwu_state(void *arg)
1450 {
1451 	int i;
1452 	u64 val;
1453 	struct mon_cfg *cfg;
1454 	u32 cur_flt, cur_ctl, mon_sel;
1455 	struct mpam_msc_ris *ris = arg;
1456 	struct msmon_mbwu_state *mbwu_state;
1457 	struct mpam_msc *msc = ris->vmsc->msc;
1458 
1459 	for (i = 0; i < ris->props.num_mbwu_mon; i++) {
1460 		mbwu_state = &ris->mbwu_state[i];
1461 		cfg = &mbwu_state->cfg;
1462 
1463 		if (WARN_ON_ONCE(!mpam_mon_sel_lock(msc)))
1464 			return -EIO;
1465 
1466 		mon_sel = FIELD_PREP(MSMON_CFG_MON_SEL_MON_SEL, i) |
1467 			  FIELD_PREP(MSMON_CFG_MON_SEL_RIS, ris->ris_idx);
1468 		mpam_write_monsel_reg(msc, CFG_MON_SEL, mon_sel);
1469 
1470 		cur_flt = mpam_read_monsel_reg(msc, CFG_MBWU_FLT);
1471 		cur_ctl = mpam_read_monsel_reg(msc, CFG_MBWU_CTL);
1472 		mpam_write_monsel_reg(msc, CFG_MBWU_CTL, 0);
1473 
1474 		if (mpam_ris_has_mbwu_long_counter(ris)) {
1475 			val = mpam_msc_read_mbwu_l(msc);
1476 			mpam_msc_zero_mbwu_l(msc);
1477 		} else {
1478 			val = mpam_read_monsel_reg(msc, MBWU);
1479 			mpam_write_monsel_reg(msc, MBWU, 0);
1480 		}
1481 
1482 		cfg->mon = i;
1483 		cfg->pmg = FIELD_GET(MSMON_CFG_x_FLT_PMG, cur_flt);
1484 		cfg->match_pmg = FIELD_GET(MSMON_CFG_x_CTL_MATCH_PMG, cur_ctl);
1485 		cfg->partid = FIELD_GET(MSMON_CFG_x_FLT_PARTID, cur_flt);
1486 		mbwu_state->correction += val;
1487 		mbwu_state->enabled = FIELD_GET(MSMON_CFG_x_CTL_EN, cur_ctl);
1488 		mpam_mon_sel_unlock(msc);
1489 	}
1490 
1491 	return 0;
1492 }
1493 
1494 static void mpam_init_reset_cfg(struct mpam_config *reset_cfg)
1495 {
1496 	*reset_cfg = (struct mpam_config) {
1497 		.reset_cpbm = true,
1498 		.reset_mbw_pbm = true,
1499 		.reset_mbw_max = true,
1500 	};
1501 	bitmap_fill(reset_cfg->features, MPAM_FEATURE_LAST);
1502 }
1503 
1504 /*
1505  * Called via smp_call_on_cpu() to prevent migration, while still being
1506  * pre-emptible. Caller must hold mpam_srcu.
1507  */
1508 static int mpam_reset_ris(void *arg)
1509 {
1510 	u16 partid, partid_max;
1511 	struct mpam_config reset_cfg;
1512 	struct mpam_msc_ris *ris = arg;
1513 
1514 	if (ris->in_reset_state)
1515 		return 0;
1516 
1517 	mpam_init_reset_cfg(&reset_cfg);
1518 
1519 	spin_lock(&partid_max_lock);
1520 	partid_max = mpam_partid_max;
1521 	spin_unlock(&partid_max_lock);
1522 	for (partid = 0; partid <= partid_max; partid++)
1523 		mpam_reprogram_ris_partid(ris, partid, &reset_cfg);
1524 
1525 	return 0;
1526 }
1527 
1528 /*
1529  * Get the preferred CPU for this MSC. If it is accessible from this CPU,
1530  * this CPU is preferred. This can be preempted/migrated; it will only result
1531  * in more work.
1532  */
1533 static int mpam_get_msc_preferred_cpu(struct mpam_msc *msc)
1534 {
1535 	int cpu = raw_smp_processor_id();
1536 
1537 	if (cpumask_test_cpu(cpu, &msc->accessibility))
1538 		return cpu;
1539 
1540 	return cpumask_first_and(&msc->accessibility, cpu_online_mask);
1541 }
1542 
1543 static int mpam_touch_msc(struct mpam_msc *msc, int (*fn)(void *a), void *arg)
1544 {
1545 	lockdep_assert_irqs_enabled();
1546 	lockdep_assert_cpus_held();
1547 	WARN_ON_ONCE(!srcu_read_lock_held((&mpam_srcu)));
1548 
1549 	return smp_call_on_cpu(mpam_get_msc_preferred_cpu(msc), fn, arg, true);
1550 }
1551 
1552 struct mpam_write_config_arg {
1553 	struct mpam_msc_ris *ris;
1554 	struct mpam_component *comp;
1555 	u16 partid;
1556 };
1557 
1558 static int __write_config(void *arg)
1559 {
1560 	struct mpam_write_config_arg *c = arg;
1561 
1562 	mpam_reprogram_ris_partid(c->ris, c->partid, &c->comp->cfg[c->partid]);
1563 
1564 	return 0;
1565 }
1566 
1567 static void mpam_reprogram_msc(struct mpam_msc *msc)
1568 {
1569 	u16 partid;
1570 	bool reset;
1571 	struct mpam_config *cfg;
1572 	struct mpam_msc_ris *ris;
1573 	struct mpam_write_config_arg arg;
1574 
1575 	/*
1576 	 * No lock for mpam_partid_max as partid_max_published has been
1577 	 * set by mpam_enabled(), so the values can no longer change.
1578 	 */
1579 	mpam_assert_partid_sizes_fixed();
1580 
1581 	mutex_lock(&msc->cfg_lock);
1582 	list_for_each_entry_srcu(ris, &msc->ris, msc_list,
1583 				 srcu_read_lock_held(&mpam_srcu)) {
1584 		if (!mpam_is_enabled() && !ris->in_reset_state) {
1585 			mpam_touch_msc(msc, &mpam_reset_ris, ris);
1586 			ris->in_reset_state = true;
1587 			continue;
1588 		}
1589 
1590 		arg.comp = ris->vmsc->comp;
1591 		arg.ris = ris;
1592 		reset = true;
1593 		for (partid = 0; partid <= mpam_partid_max; partid++) {
1594 			cfg = &ris->vmsc->comp->cfg[partid];
1595 			if (!bitmap_empty(cfg->features, MPAM_FEATURE_LAST))
1596 				reset = false;
1597 
1598 			arg.partid = partid;
1599 			mpam_touch_msc(msc, __write_config, &arg);
1600 		}
1601 		ris->in_reset_state = reset;
1602 
1603 		if (mpam_has_feature(mpam_feat_msmon_mbwu, &ris->props))
1604 			mpam_touch_msc(msc, &mpam_restore_mbwu_state, ris);
1605 	}
1606 	mutex_unlock(&msc->cfg_lock);
1607 }
1608 
1609 static void _enable_percpu_irq(void *_irq)
1610 {
1611 	int *irq = _irq;
1612 
1613 	enable_percpu_irq(*irq, IRQ_TYPE_NONE);
1614 }
1615 
1616 static int mpam_cpu_online(unsigned int cpu)
1617 {
1618 	struct mpam_msc *msc;
1619 
1620 	guard(srcu)(&mpam_srcu);
1621 	list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
1622 				 srcu_read_lock_held(&mpam_srcu)) {
1623 		if (!cpumask_test_cpu(cpu, &msc->accessibility))
1624 			continue;
1625 
1626 		if (msc->reenable_error_ppi)
1627 			_enable_percpu_irq(&msc->reenable_error_ppi);
1628 
1629 		if (atomic_fetch_inc(&msc->online_refs) == 0)
1630 			mpam_reprogram_msc(msc);
1631 	}
1632 
1633 	return 0;
1634 }
1635 
1636 /* Before mpam is enabled, try to probe new MSC */
1637 static int mpam_discovery_cpu_online(unsigned int cpu)
1638 {
1639 	int err = 0;
1640 	struct mpam_msc *msc;
1641 	bool new_device_probed = false;
1642 
1643 	if (mpam_is_enabled())
1644 		return 0;
1645 
1646 	guard(srcu)(&mpam_srcu);
1647 	list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
1648 				 srcu_read_lock_held(&mpam_srcu)) {
1649 		if (!cpumask_test_cpu(cpu, &msc->accessibility))
1650 			continue;
1651 
1652 		mutex_lock(&msc->probe_lock);
1653 		if (!msc->probed)
1654 			err = mpam_msc_hw_probe(msc);
1655 		mutex_unlock(&msc->probe_lock);
1656 
1657 		if (err)
1658 			break;
1659 		new_device_probed = true;
1660 	}
1661 
1662 	if (new_device_probed && !err)
1663 		schedule_work(&mpam_enable_work);
1664 	if (err) {
1665 		mpam_disable_reason = "error during probing";
1666 		schedule_work(&mpam_broken_work);
1667 	}
1668 
1669 	return err;
1670 }
1671 
1672 static int mpam_cpu_offline(unsigned int cpu)
1673 {
1674 	struct mpam_msc *msc;
1675 
1676 	guard(srcu)(&mpam_srcu);
1677 	list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
1678 				 srcu_read_lock_held(&mpam_srcu)) {
1679 		if (!cpumask_test_cpu(cpu, &msc->accessibility))
1680 			continue;
1681 
1682 		if (msc->reenable_error_ppi)
1683 			disable_percpu_irq(msc->reenable_error_ppi);
1684 
1685 		if (atomic_dec_and_test(&msc->online_refs)) {
1686 			struct mpam_msc_ris *ris;
1687 
1688 			mutex_lock(&msc->cfg_lock);
1689 			list_for_each_entry_srcu(ris, &msc->ris, msc_list,
1690 						 srcu_read_lock_held(&mpam_srcu)) {
1691 				mpam_touch_msc(msc, &mpam_reset_ris, ris);
1692 
1693 				/*
1694 				 * The reset state for non-zero partid may be
1695 				 * lost while the CPUs are offline.
1696 				 */
1697 				ris->in_reset_state = false;
1698 
1699 				if (mpam_is_enabled())
1700 					mpam_touch_msc(msc, &mpam_save_mbwu_state, ris);
1701 			}
1702 			mutex_unlock(&msc->cfg_lock);
1703 		}
1704 	}
1705 
1706 	return 0;
1707 }
1708 
1709 static void mpam_register_cpuhp_callbacks(int (*online)(unsigned int online),
1710 					  int (*offline)(unsigned int offline),
1711 					  char *name)
1712 {
1713 	mutex_lock(&mpam_cpuhp_state_lock);
1714 	if (mpam_cpuhp_state) {
1715 		cpuhp_remove_state(mpam_cpuhp_state);
1716 		mpam_cpuhp_state = 0;
1717 	}
1718 
1719 	mpam_cpuhp_state = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, name, online,
1720 					     offline);
1721 	if (mpam_cpuhp_state <= 0) {
1722 		pr_err("Failed to register cpuhp callbacks");
1723 		mpam_cpuhp_state = 0;
1724 	}
1725 	mutex_unlock(&mpam_cpuhp_state_lock);
1726 }
1727 
1728 static int __setup_ppi(struct mpam_msc *msc)
1729 {
1730 	int cpu;
1731 
1732 	msc->error_dev_id = alloc_percpu(struct mpam_msc *);
1733 	if (!msc->error_dev_id)
1734 		return -ENOMEM;
1735 
1736 	for_each_cpu(cpu, &msc->accessibility)
1737 		*per_cpu_ptr(msc->error_dev_id, cpu) = msc;
1738 
1739 	return 0;
1740 }
1741 
1742 static int mpam_msc_setup_error_irq(struct mpam_msc *msc)
1743 {
1744 	int irq;
1745 
1746 	irq = platform_get_irq_byname_optional(msc->pdev, "error");
1747 	if (irq <= 0)
1748 		return 0;
1749 
1750 	/* Allocate and initialise the percpu device pointer for PPI */
1751 	if (irq_is_percpu(irq))
1752 		return __setup_ppi(msc);
1753 
1754 	/* Sanity check: a shared interrupt can fire on any CPU, so the MSC must be accessible from all of them */
1755 	if (!cpumask_equal(&msc->accessibility, cpu_possible_mask)) {
1756 		pr_err_once("msc:%u is a private resource with a shared error interrupt",
1757 			    msc->id);
1758 		return -EINVAL;
1759 	}
1760 
1761 	return 0;
1762 }
1763 
1764 /*
1765  * An MSC can control traffic from a set of CPUs, but may only be accessible
1766  * from a (hopefully wider) set of CPUs. The common reason for this is power
1767  * management. If all the CPUs in a cluster are in PSCI:CPU_SUSPEND, the
1768  * corresponding cache may also be powered off. By making accesses from
1769  * one of those CPUs, we ensure we don't access a cache that's powered off.
1770  */
1771 static void update_msc_accessibility(struct mpam_msc *msc)
1772 {
1773 	u32 affinity_id;
1774 	int err;
1775 
1776 	err = device_property_read_u32(&msc->pdev->dev, "cpu_affinity",
1777 				       &affinity_id);
1778 	if (err)
1779 		cpumask_copy(&msc->accessibility, cpu_possible_mask);
1780 	else
1781 		acpi_pptt_get_cpus_from_container(affinity_id, &msc->accessibility);
1782 }
1783 
1784 /*
1785  * There are two ways of reaching a struct mpam_msc_ris. Via the
1786  * class->component->vmsc->ris, or via the msc.
1787  * When destroying the msc, the other side needs unlinking and cleaning up too.
1788  */
1789 static void mpam_msc_destroy(struct mpam_msc *msc)
1790 {
1791 	struct platform_device *pdev = msc->pdev;
1792 	struct mpam_msc_ris *ris, *tmp;
1793 
1794 	lockdep_assert_held(&mpam_list_lock);
1795 
1796 	list_for_each_entry_safe(ris, tmp, &msc->ris, msc_list)
1797 		mpam_ris_destroy(ris);
1798 
1799 	list_del_rcu(&msc->all_msc_list);
1800 	platform_set_drvdata(pdev, NULL);
1801 
1802 	add_to_garbage(msc);
1803 }
1804 
1805 static void mpam_msc_drv_remove(struct platform_device *pdev)
1806 {
1807 	struct mpam_msc *msc = platform_get_drvdata(pdev);
1808 
1809 	mutex_lock(&mpam_list_lock);
1810 	mpam_msc_destroy(msc);
1811 	mutex_unlock(&mpam_list_lock);
1812 
1813 	mpam_free_garbage();
1814 }
1815 
1816 static struct mpam_msc *do_mpam_msc_drv_probe(struct platform_device *pdev)
1817 {
1818 	int err;
1819 	u32 tmp;
1820 	struct mpam_msc *msc;
1821 	struct resource *msc_res;
1822 	struct device *dev = &pdev->dev;
1823 
1824 	lockdep_assert_held(&mpam_list_lock);
1825 
1826 	msc = devm_kzalloc(&pdev->dev, sizeof(*msc), GFP_KERNEL);
1827 	if (!msc)
1828 		return ERR_PTR(-ENOMEM);
1829 	init_garbage(&msc->garbage);
1830 	msc->garbage.pdev = pdev;
1831 
1832 	err = devm_mutex_init(dev, &msc->probe_lock);
1833 	if (err)
1834 		return ERR_PTR(err);
1835 
1836 	err = devm_mutex_init(dev, &msc->part_sel_lock);
1837 	if (err)
1838 		return ERR_PTR(err);
1839 
1840 	err = devm_mutex_init(dev, &msc->error_irq_lock);
1841 	if (err)
1842 		return ERR_PTR(err);
1843 
1844 	err = devm_mutex_init(dev, &msc->cfg_lock);
1845 	if (err)
1846 		return ERR_PTR(err);
1847 
1848 	mpam_mon_sel_lock_init(msc);
1849 	msc->id = pdev->id;
1850 	msc->pdev = pdev;
1851 	INIT_LIST_HEAD_RCU(&msc->all_msc_list);
1852 	INIT_LIST_HEAD_RCU(&msc->ris);
1853 
1854 	update_msc_accessibility(msc);
1855 	if (cpumask_empty(&msc->accessibility)) {
1856 		dev_err_once(dev, "MSC is not accessible from any CPU!");
1857 		return ERR_PTR(-EINVAL);
1858 	}
1859 
1860 	err = mpam_msc_setup_error_irq(msc);
1861 	if (err)
1862 		return ERR_PTR(err);
1863 
1864 	if (device_property_read_u32(&pdev->dev, "pcc-channel", &tmp))
1865 		msc->iface = MPAM_IFACE_MMIO;
1866 	else
1867 		msc->iface = MPAM_IFACE_PCC;
1868 
1869 	if (msc->iface == MPAM_IFACE_MMIO) {
1870 		void __iomem *io;
1871 
1872 		io = devm_platform_get_and_ioremap_resource(pdev, 0,
1873 							    &msc_res);
1874 		if (IS_ERR(io)) {
1875 			dev_err_once(dev, "Failed to map MSC base address\n");
1876 			return ERR_CAST(io);
1877 		}
1878 		msc->mapped_hwpage_sz = msc_res->end - msc_res->start;
1879 		msc->mapped_hwpage = io;
1880 	} else {
1881 		return ERR_PTR(-EINVAL);
1882 	}
1883 
1884 	list_add_rcu(&msc->all_msc_list, &mpam_all_msc);
1885 	platform_set_drvdata(pdev, msc);
1886 
1887 	return msc;
1888 }
1889 
1890 static int fw_num_msc;
1891 
1892 static int mpam_msc_drv_probe(struct platform_device *pdev)
1893 {
1894 	int err;
1895 	struct mpam_msc *msc = NULL;
1896 	void *plat_data = pdev->dev.platform_data;
1897 
1898 	mutex_lock(&mpam_list_lock);
1899 	msc = do_mpam_msc_drv_probe(pdev);
1900 	mutex_unlock(&mpam_list_lock);
1901 
1902 	if (IS_ERR(msc))
1903 		return PTR_ERR(msc);
1904 
1905 	/* Create RIS entries described by firmware */
1906 	err = acpi_mpam_parse_resources(msc, plat_data);
1907 	if (err) {
1908 		mpam_msc_drv_remove(pdev);
1909 		return err;
1910 	}
1911 
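	/*
	 * Once the last firmware-described MSC has bound to this driver,
	 * register the cpuhp callback that probes each MSC's hardware from
	 * a CPU that can reach it.
	 */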
1912 	if (atomic_add_return(1, &mpam_num_msc) == fw_num_msc)
1913 		mpam_register_cpuhp_callbacks(mpam_discovery_cpu_online, NULL,
1914 					      "mpam:drv_probe");
1915 
1916 	return 0;
1917 }
1918 
1919 static struct platform_driver mpam_msc_driver = {
1920 	.driver = {
1921 		.name = "mpam_msc",
1922 	},
1923 	.probe = mpam_msc_drv_probe,
1924 	.remove = mpam_msc_drv_remove,
1925 };
1926 
1927 /* Any of these features mean the BWA_WD field is valid. */
1928 static bool mpam_has_bwa_wd_feature(struct mpam_props *props)
1929 {
1930 	if (mpam_has_feature(mpam_feat_mbw_min, props))
1931 		return true;
1932 	if (mpam_has_feature(mpam_feat_mbw_max, props))
1933 		return true;
1934 	if (mpam_has_feature(mpam_feat_mbw_prop, props))
1935 		return true;
1936 	return false;
1937 }
1938 
1939 /* Any of these features mean the CMAX_WD field is valid. */
1940 static bool mpam_has_cmax_wd_feature(struct mpam_props *props)
1941 {
1942 	if (mpam_has_feature(mpam_feat_cmax_cmax, props))
1943 		return true;
1944 	if (mpam_has_feature(mpam_feat_cmax_cmin, props))
1945 		return true;
1946 	return false;
1947 }
1948 
1949 #define MISMATCHED_HELPER(parent, child, helper, field, alias)		\
1950 	helper(parent) &&						\
1951 	((helper(child) && (parent)->field != (child)->field) ||	\
1952 	 (!helper(child) && !(alias)))
1953 
1954 #define MISMATCHED_FEAT(parent, child, feat, field, alias)		     \
1955 	mpam_has_feature((feat), (parent)) &&				     \
1956 	((mpam_has_feature((feat), (child)) && (parent)->field != (child)->field) || \
1957 	 (!mpam_has_feature((feat), (child)) && !(alias)))
1958 
1959 #define CAN_MERGE_FEAT(parent, child, feat, alias)			\
1960 	(alias) && !mpam_has_feature((feat), (parent)) &&		\
1961 	mpam_has_feature((feat), (child))
1962 
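/*
 * CAN_MERGE_FEAT: the parent lacks a feature the child has, and both alias
 * the same resource, so the child's value can simply be copied up.
 * MISMATCHED_FEAT/MISMATCHED_HELPER: the parent has the feature but the
 * child's field value differs, or the child lacks the feature and the two
 * do not alias, so a safe combined value must be chosen.
 */
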
1963 /*
1964  * Combine two props fields.
1965  * If this is for controls that alias the same resource, it is safe to just
1966  * copy the values over. If two aliasing controls implement the same scheme,
1967  * a safe value must be picked.
1968  * Non-aliasing controls regulate different resources, so the resulting
1969  * safe value must be compatible with both. When merging values in
1970  * the tree, all the aliasing resources must be handled first.
1971  * On mismatch, parent is modified.
1972  */
1973 static void __props_mismatch(struct mpam_props *parent,
1974 			     struct mpam_props *child, bool alias)
1975 {
1976 	if (CAN_MERGE_FEAT(parent, child, mpam_feat_cpor_part, alias)) {
1977 		parent->cpbm_wd = child->cpbm_wd;
1978 	} else if (MISMATCHED_FEAT(parent, child, mpam_feat_cpor_part,
1979 				   cpbm_wd, alias)) {
1980 		pr_debug("cleared cpor_part\n");
1981 		mpam_clear_feature(mpam_feat_cpor_part, parent);
1982 		parent->cpbm_wd = 0;
1983 	}
1984 
1985 	if (CAN_MERGE_FEAT(parent, child, mpam_feat_mbw_part, alias)) {
1986 		parent->mbw_pbm_bits = child->mbw_pbm_bits;
1987 	} else if (MISMATCHED_FEAT(parent, child, mpam_feat_mbw_part,
1988 				   mbw_pbm_bits, alias)) {
1989 		pr_debug("cleared mbw_part\n");
1990 		mpam_clear_feature(mpam_feat_mbw_part, parent);
1991 		parent->mbw_pbm_bits = 0;
1992 	}
1993 
1994 	/* bwa_wd is a count of bits; fewer bits means less precision */
1995 	if (alias && !mpam_has_bwa_wd_feature(parent) &&
1996 	    mpam_has_bwa_wd_feature(child)) {
1997 		parent->bwa_wd = child->bwa_wd;
1998 	} else if (MISMATCHED_HELPER(parent, child, mpam_has_bwa_wd_feature,
1999 				     bwa_wd, alias)) {
2000 		pr_debug("took the min bwa_wd\n");
2001 		parent->bwa_wd = min(parent->bwa_wd, child->bwa_wd);
2002 	}
2003 
2004 	if (alias && !mpam_has_cmax_wd_feature(parent) && mpam_has_cmax_wd_feature(child)) {
2005 		parent->cmax_wd = child->cmax_wd;
2006 	} else if (MISMATCHED_HELPER(parent, child, mpam_has_cmax_wd_feature,
2007 				     cmax_wd, alias)) {
2008 		pr_debug("%s took the min cmax_wd\n", __func__);
2009 		parent->cmax_wd = min(parent->cmax_wd, child->cmax_wd);
2010 	}
2011 
2012 	if (CAN_MERGE_FEAT(parent, child, mpam_feat_cmax_cassoc, alias)) {
2013 		parent->cassoc_wd = child->cassoc_wd;
2014 	} else if (MISMATCHED_FEAT(parent, child, mpam_feat_cmax_cassoc,
2015 				   cassoc_wd, alias)) {
2016 		pr_debug("%s cleared cassoc_wd\n", __func__);
2017 		mpam_clear_feature(mpam_feat_cmax_cassoc, parent);
2018 		parent->cassoc_wd = 0;
2019 	}
2020 
2021 	/* For num properties, take the minimum */
2022 	if (CAN_MERGE_FEAT(parent, child, mpam_feat_msmon_csu, alias)) {
2023 		parent->num_csu_mon = child->num_csu_mon;
2024 	} else if (MISMATCHED_FEAT(parent, child, mpam_feat_msmon_csu,
2025 				   num_csu_mon, alias)) {
2026 		pr_debug("took the min num_csu_mon\n");
2027 		parent->num_csu_mon = min(parent->num_csu_mon,
2028 					  child->num_csu_mon);
2029 	}
2030 
2031 	if (CAN_MERGE_FEAT(parent, child, mpam_feat_msmon_mbwu, alias)) {
2032 		parent->num_mbwu_mon = child->num_mbwu_mon;
2033 	} else if (MISMATCHED_FEAT(parent, child, mpam_feat_msmon_mbwu,
2034 				   num_mbwu_mon, alias)) {
2035 		pr_debug("took the min num_mbwu_mon\n");
2036 		parent->num_mbwu_mon = min(parent->num_mbwu_mon,
2037 					   child->num_mbwu_mon);
2038 	}
2039 
2040 	if (CAN_MERGE_FEAT(parent, child, mpam_feat_intpri_part, alias)) {
2041 		parent->intpri_wd = child->intpri_wd;
2042 	} else if (MISMATCHED_FEAT(parent, child, mpam_feat_intpri_part,
2043 				   intpri_wd, alias)) {
2044 		pr_debug("%s took the min intpri_wd\n", __func__);
2045 		parent->intpri_wd = min(parent->intpri_wd, child->intpri_wd);
2046 	}
2047 
2048 	if (CAN_MERGE_FEAT(parent, child, mpam_feat_dspri_part, alias)) {
2049 		parent->dspri_wd = child->dspri_wd;
2050 	} else if (MISMATCHED_FEAT(parent, child, mpam_feat_dspri_part,
2051 				   dspri_wd, alias)) {
2052 		pr_debug("%s took the min dspri_wd\n", __func__);
2053 		parent->dspri_wd = min(parent->dspri_wd, child->dspri_wd);
2054 	}
2055 
2056 	/* TODO: alias support for these two */
2057 	/* {int,ds}pri may not have differing 0-low behaviour */
2058 	if (mpam_has_feature(mpam_feat_intpri_part, parent) &&
2059 	    (!mpam_has_feature(mpam_feat_intpri_part, child) ||
2060 	     mpam_has_feature(mpam_feat_intpri_part_0_low, parent) !=
2061 	     mpam_has_feature(mpam_feat_intpri_part_0_low, child))) {
2062 		pr_debug("%s cleared intpri_part\n", __func__);
2063 		mpam_clear_feature(mpam_feat_intpri_part, parent);
2064 		mpam_clear_feature(mpam_feat_intpri_part_0_low, parent);
2065 	}
2066 	if (mpam_has_feature(mpam_feat_dspri_part, parent) &&
2067 	    (!mpam_has_feature(mpam_feat_dspri_part, child) ||
2068 	     mpam_has_feature(mpam_feat_dspri_part_0_low, parent) !=
2069 	     mpam_has_feature(mpam_feat_dspri_part_0_low, child))) {
2070 		pr_debug("%s cleared dspri_part\n", __func__);
2071 		mpam_clear_feature(mpam_feat_dspri_part, parent);
2072 		mpam_clear_feature(mpam_feat_dspri_part_0_low, parent);
2073 	}
2074 
2075 	if (alias) {
2076 		/* Merge features for aliased resources */
2077 		bitmap_or(parent->features, parent->features, child->features, MPAM_FEATURE_LAST);
2078 	} else {
2079 		/* Clear missing features for non aliasing */
2080 		bitmap_and(parent->features, parent->features, child->features, MPAM_FEATURE_LAST);
2081 	}
2082 }
2083 
2084 /*
2085  * If a vmsc doesn't match class feature/configuration, do the right thing(tm).
2086  * For 'num' properties we can just take the minimum.
2087  * For properties where the mismatched unused bits would make a difference, we
2088  * nobble the class feature, as we can't configure all the resources.
2089  * e.g. The L3 cache is composed of two resources with 13-bit and 17-bit
2090  * portion bitmaps respectively.
2091  */
2092 static void
2093 __class_props_mismatch(struct mpam_class *class, struct mpam_vmsc *vmsc)
2094 {
2095 	struct mpam_props *cprops = &class->props;
2096 	struct mpam_props *vprops = &vmsc->props;
2097 	struct device *dev = &vmsc->msc->pdev->dev;
2098 
2099 	lockdep_assert_held(&mpam_list_lock); /* we modify class */
2100 
2101 	dev_dbg(dev, "Merging features for class:0x%lx &= vmsc:0x%lx\n",
2102 		(long)cprops->features, (long)vprops->features);
2103 
2104 	/* Take the safe value for any common features */
2105 	__props_mismatch(cprops, vprops, false);
2106 }
2107 
2108 static void
2109 __vmsc_props_mismatch(struct mpam_vmsc *vmsc, struct mpam_msc_ris *ris)
2110 {
2111 	struct mpam_props *rprops = &ris->props;
2112 	struct mpam_props *vprops = &vmsc->props;
2113 	struct device *dev = &vmsc->msc->pdev->dev;
2114 
2115 	lockdep_assert_held(&mpam_list_lock); /* we modify vmsc */
2116 
2117 	dev_dbg(dev, "Merging features for vmsc:0x%lx |= ris:0x%lx\n",
2118 		(long)vprops->features, (long)rprops->features);
2119 
2120 	/*
2121 	 * Merge mismatched features - Copy any features that aren't common,
2122 	 * but take the safe value for any common features.
2123 	 */
2124 	__props_mismatch(vprops, rprops, true);
2125 }
2126 
2127 /*
2128  * Copy the first component's first vMSC's properties and features to the
2129  * class. __class_props_mismatch() will remove conflicts.
2130  * It is not possible to have a class with no components, or a component with
2131  * no resources. The vMSC properties have already been built.
2132  */
2133 static void mpam_enable_init_class_features(struct mpam_class *class)
2134 {
2135 	struct mpam_vmsc *vmsc;
2136 	struct mpam_component *comp;
2137 
2138 	comp = list_first_entry(&class->components,
2139 				struct mpam_component, class_list);
2140 	vmsc = list_first_entry(&comp->vmsc,
2141 				struct mpam_vmsc, comp_list);
2142 
2143 	class->props = vmsc->props;
2144 }
2145 
2146 static void mpam_enable_merge_vmsc_features(struct mpam_component *comp)
2147 {
2148 	struct mpam_vmsc *vmsc;
2149 	struct mpam_msc_ris *ris;
2150 	struct mpam_class *class = comp->class;
2151 
2152 	list_for_each_entry(vmsc, &comp->vmsc, comp_list) {
2153 		list_for_each_entry(ris, &vmsc->ris, vmsc_list) {
2154 			__vmsc_props_mismatch(vmsc, ris);
2155 			class->nrdy_usec = max(class->nrdy_usec,
2156 					       vmsc->msc->nrdy_usec);
2157 		}
2158 	}
2159 }
2160 
2161 static void mpam_enable_merge_class_features(struct mpam_component *comp)
2162 {
2163 	struct mpam_vmsc *vmsc;
2164 	struct mpam_class *class = comp->class;
2165 
2166 	list_for_each_entry(vmsc, &comp->vmsc, comp_list)
2167 		__class_props_mismatch(class, vmsc);
2168 }
2169 
2170 /*
2171  * Merge all the common resource features into class.
2172  * vmsc features are bitwise-or'd together by mpam_enable_merge_vmsc_features()
2173  * as the first step so that mpam_enable_init_class_features() can initialise
2174  * the class with a representative set of features.
2175  * Next the mpam_enable_merge_class_features() bitwise-and's all the vmsc
2176  * features to form the class features.
2177  * Other features are the min/max as appropriate.
2178  *
2179  * To avoid walking the whole tree twice, the class->nrdy_usec property is
2180  * updated when working with the vmsc as it is a max(), and doesn't need
2181  * initialising first.
2182  */
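/*
 * In pseudo-code, for each class:
 *	for each component: OR each RIS's features into its vmsc  (merge_vmsc)
 *	class->props = first component's first vmsc's props	   (init_class)
 *	for each component: AND each vmsc's features into class   (merge_class)
 */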
2183 static void mpam_enable_merge_features(struct list_head *all_classes_list)
2184 {
2185 	struct mpam_class *class;
2186 	struct mpam_component *comp;
2187 
2188 	lockdep_assert_held(&mpam_list_lock);
2189 
2190 	list_for_each_entry(class, all_classes_list, classes_list) {
2191 		list_for_each_entry(comp, &class->components, class_list)
2192 			mpam_enable_merge_vmsc_features(comp);
2193 
2194 		mpam_enable_init_class_features(class);
2195 
2196 		list_for_each_entry(comp, &class->components, class_list)
2197 			mpam_enable_merge_class_features(comp);
2198 	}
2199 }
2200 
2201 static char *mpam_errcode_names[16] = {
2202 	[MPAM_ERRCODE_NONE]			= "No error",
2203 	[MPAM_ERRCODE_PARTID_SEL_RANGE]		= "PARTID_SEL_Range",
2204 	[MPAM_ERRCODE_REQ_PARTID_RANGE]		= "Req_PARTID_Range",
2205 	[MPAM_ERRCODE_MSMONCFG_ID_RANGE]	= "MSMONCFG_ID_RANGE",
2206 	[MPAM_ERRCODE_REQ_PMG_RANGE]		= "Req_PMG_Range",
2207 	[MPAM_ERRCODE_MONITOR_RANGE]		= "Monitor_Range",
2208 	[MPAM_ERRCODE_INTPARTID_RANGE]		= "intPARTID_Range",
2209 	[MPAM_ERRCODE_UNEXPECTED_INTERNAL]	= "Unexpected_INTERNAL",
2210 	[MPAM_ERRCODE_UNDEFINED_RIS_PART_SEL]	= "Undefined_RIS_PART_SEL",
2211 	[MPAM_ERRCODE_RIS_NO_CONTROL]		= "RIS_No_Control",
2212 	[MPAM_ERRCODE_UNDEFINED_RIS_MON_SEL]	= "Undefined_RIS_MON_SEL",
2213 	[MPAM_ERRCODE_RIS_NO_MONITOR]		= "RIS_No_Monitor",
2214 	[12 ... 15] = "Reserved"
2215 };
2216 
2217 static int mpam_enable_msc_ecr(void *_msc)
2218 {
2219 	struct mpam_msc *msc = _msc;
2220 
2221 	__mpam_write_reg(msc, MPAMF_ECR, MPAMF_ECR_INTEN);
2222 
2223 	return 0;
2224 }
2225 
2226 /* This can run from mpam_disable() and from the interrupt handler on the same CPU */
2227 static int mpam_disable_msc_ecr(void *_msc)
2228 {
2229 	struct mpam_msc *msc = _msc;
2230 
2231 	__mpam_write_reg(msc, MPAMF_ECR, 0);
2232 
2233 	return 0;
2234 }
2235 
2236 static irqreturn_t __mpam_irq_handler(int irq, struct mpam_msc *msc)
2237 {
2238 	u64 reg;
2239 	u16 partid;
2240 	u8 errcode, pmg, ris;
2241 
2242 	if (WARN_ON_ONCE(!msc) ||
2243 	    WARN_ON_ONCE(!cpumask_test_cpu(smp_processor_id(),
2244 					   &msc->accessibility)))
2245 		return IRQ_NONE;
2246 
2247 	reg = mpam_msc_read_esr(msc);
2248 
2249 	errcode = FIELD_GET(MPAMF_ESR_ERRCODE, reg);
2250 	if (!errcode)
2251 		return IRQ_NONE;
2252 
2253 	/* Clear level triggered irq */
2254 	mpam_msc_clear_esr(msc);
2255 
2256 	partid = FIELD_GET(MPAMF_ESR_PARTID_MON, reg);
2257 	pmg = FIELD_GET(MPAMF_ESR_PMG, reg);
2258 	ris = FIELD_GET(MPAMF_ESR_RIS, reg);
2259 
2260 	pr_err_ratelimited("error irq from msc:%u '%s', partid:%u, pmg: %u, ris: %u\n",
2261 			   msc->id, mpam_errcode_names[errcode], partid, pmg,
2262 			   ris);
2263 
2264 	/* Disable this interrupt. */
2265 	mpam_disable_msc_ecr(msc);
2266 
2267 	/* Are we racing with the thread disabling MPAM? */
2268 	if (!mpam_is_enabled())
2269 		return IRQ_HANDLED;
2270 
2271 	/*
2272 	 * Schedule the teardown work. Don't use a threaded IRQ as we can't
2273 	 * unregister the interrupt from the threaded part of the handler.
2274 	 */
2275 	mpam_disable_reason = "hardware error interrupt";
2276 	schedule_work(&mpam_broken_work);
2277 
2278 	return IRQ_HANDLED;
2279 }
2280 
2281 static irqreturn_t mpam_ppi_handler(int irq, void *dev_id)
2282 {
2283 	struct mpam_msc *msc = *(struct mpam_msc **)dev_id;
2284 
2285 	return __mpam_irq_handler(irq, msc);
2286 }
2287 
2288 static irqreturn_t mpam_spi_handler(int irq, void *dev_id)
2289 {
2290 	struct mpam_msc *msc = dev_id;
2291 
2292 	return __mpam_irq_handler(irq, msc);
2293 }
2294 
2295 static int mpam_register_irqs(void)
2296 {
2297 	int err, irq;
2298 	struct mpam_msc *msc;
2299 
2300 	lockdep_assert_cpus_held();
2301 
2302 	guard(srcu)(&mpam_srcu);
2303 	list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
2304 				 srcu_read_lock_held(&mpam_srcu)) {
2305 		irq = platform_get_irq_byname_optional(msc->pdev, "error");
2306 		if (irq <= 0)
2307 			continue;
2308 
2309 		/* The MPAM spec says the interrupt can be SPI, PPI or LPI */
2310 		/* We anticipate sharing the interrupt with other MSCs */
2311 		if (irq_is_percpu(irq)) {
2312 			err = request_percpu_irq(irq, &mpam_ppi_handler,
2313 						 "mpam:msc:error",
2314 						 msc->error_dev_id);
2315 			if (err)
2316 				return err;
2317 
2318 			msc->reenable_error_ppi = irq;
2319 			smp_call_function_many(&msc->accessibility,
2320 					       &_enable_percpu_irq, &irq,
2321 					       true);
2322 		} else {
2323 			err = devm_request_irq(&msc->pdev->dev, irq,
2324 					       &mpam_spi_handler, IRQF_SHARED,
2325 					       "mpam:msc:error", msc);
2326 			if (err)
2327 				return err;
2328 		}
2329 
2330 		mutex_lock(&msc->error_irq_lock);
2331 		msc->error_irq_req = true;
2332 		mpam_touch_msc(msc, mpam_enable_msc_ecr, msc);
2333 		msc->error_irq_hw_enabled = true;
2334 		mutex_unlock(&msc->error_irq_lock);
2335 	}
2336 
2337 	return 0;
2338 }
2339 
2340 static void mpam_unregister_irqs(void)
2341 {
2342 	int irq;
2343 	struct mpam_msc *msc;
2344 
2345 	guard(cpus_read_lock)();
2346 	guard(srcu)(&mpam_srcu);
2347 	list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
2348 				 srcu_read_lock_held(&mpam_srcu)) {
2349 		irq = platform_get_irq_byname_optional(msc->pdev, "error");
2350 		if (irq <= 0)
2351 			continue;
2352 
2353 		mutex_lock(&msc->error_irq_lock);
2354 		if (msc->error_irq_hw_enabled) {
2355 			mpam_touch_msc(msc, mpam_disable_msc_ecr, msc);
2356 			msc->error_irq_hw_enabled = false;
2357 		}
2358 
2359 		if (msc->error_irq_req) {
2360 			if (irq_is_percpu(irq)) {
2361 				msc->reenable_error_ppi = 0;
2362 				free_percpu_irq(irq, msc->error_dev_id);
2363 			} else {
2364 				devm_free_irq(&msc->pdev->dev, irq, msc);
2365 			}
2366 			msc->error_irq_req = false;
2367 		}
2368 		mutex_unlock(&msc->error_irq_lock);
2369 	}
2370 }
2371 
2372 static void __destroy_component_cfg(struct mpam_component *comp)
2373 {
2374 	struct mpam_msc *msc;
2375 	struct mpam_vmsc *vmsc;
2376 	struct mpam_msc_ris *ris;
2377 
2378 	lockdep_assert_held(&mpam_list_lock);
2379 
2380 	add_to_garbage(comp->cfg);
2381 	list_for_each_entry(vmsc, &comp->vmsc, comp_list) {
2382 		msc = vmsc->msc;
2383 
2384 		if (mpam_mon_sel_lock(msc)) {
2385 			list_for_each_entry(ris, &vmsc->ris, vmsc_list)
2386 				add_to_garbage(ris->mbwu_state);
2387 			mpam_mon_sel_unlock(msc);
2388 		}
2389 	}
2390 }
2391 
2392 static void mpam_reset_component_cfg(struct mpam_component *comp)
2393 {
2394 	int i;
2395 	struct mpam_props *cprops = &comp->class->props;
2396 
2397 	mpam_assert_partid_sizes_fixed();
2398 
2399 	if (!comp->cfg)
2400 		return;
2401 
2402 	for (i = 0; i <= mpam_partid_max; i++) {
2403 		comp->cfg[i] = (struct mpam_config) {};
2404 		if (cprops->cpbm_wd)
2405 			comp->cfg[i].cpbm = GENMASK(cprops->cpbm_wd - 1, 0);
2406 		if (cprops->mbw_pbm_bits)
2407 			comp->cfg[i].mbw_pbm = GENMASK(cprops->mbw_pbm_bits - 1, 0);
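		/*
		 * The bwa_wd implemented bits sit at the top of the 16-bit
		 * fixed-point MBW_MAX fraction, so all-ones is the most
		 * permissive (maximum) bandwidth limit.
		 */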
2408 		if (cprops->bwa_wd)
2409 			comp->cfg[i].mbw_max = GENMASK(15, 16 - cprops->bwa_wd);
2410 	}
2411 }
2412 
2413 static int __allocate_component_cfg(struct mpam_component *comp)
2414 {
2415 	struct mpam_vmsc *vmsc;
2416 
2417 	mpam_assert_partid_sizes_fixed();
2418 
2419 	if (comp->cfg)
2420 		return 0;
2421 
2422 	comp->cfg = kcalloc(mpam_partid_max + 1, sizeof(*comp->cfg), GFP_KERNEL);
2423 	if (!comp->cfg)
2424 		return -ENOMEM;
2425 
2426 	/*
2427 	 * The array is free()d in one go, so only cfg[0]'s structure needs
2428 	 * to be initialised.
2429 	 */
2430 	init_garbage(&comp->cfg[0].garbage);
2431 
2432 	mpam_reset_component_cfg(comp);
2433 
2434 	list_for_each_entry(vmsc, &comp->vmsc, comp_list) {
2435 		struct mpam_msc *msc;
2436 		struct mpam_msc_ris *ris;
2437 		struct msmon_mbwu_state *mbwu_state;
2438 
2439 		if (!vmsc->props.num_mbwu_mon)
2440 			continue;
2441 
2442 		msc = vmsc->msc;
2443 		list_for_each_entry(ris, &vmsc->ris, vmsc_list) {
2444 			if (!ris->props.num_mbwu_mon)
2445 				continue;
2446 
2447 			mbwu_state = kcalloc(ris->props.num_mbwu_mon,
2448 					     sizeof(*ris->mbwu_state),
2449 					     GFP_KERNEL);
2450 			if (!mbwu_state) {
2451 				__destroy_component_cfg(comp);
2452 				return -ENOMEM;
2453 			}
2454 
2455 			init_garbage(&mbwu_state[0].garbage);
2456 
2457 			if (mpam_mon_sel_lock(msc)) {
2458 				ris->mbwu_state = mbwu_state;
2459 				mpam_mon_sel_unlock(msc);
2460 			}
2461 		}
2462 	}
2463 
2464 	return 0;
2465 }
2466 
2467 static int mpam_allocate_config(void)
2468 {
2469 	struct mpam_class *class;
2470 	struct mpam_component *comp;
2471 
2472 	lockdep_assert_held(&mpam_list_lock);
2473 
2474 	list_for_each_entry(class, &mpam_classes, classes_list) {
2475 		list_for_each_entry(comp, &class->components, class_list) {
2476 			int err = __allocate_component_cfg(comp);
2477 			if (err)
2478 				return err;
2479 		}
2480 	}
2481 
2482 	return 0;
2483 }
2484 
2485 static void mpam_enable_once(void)
2486 {
2487 	int err;
2488 
2489 	/*
2490 	 * Once the cpuhp callbacks have been changed, mpam_partid_max can no
2491 	 * longer change.
2492 	 */
2493 	spin_lock(&partid_max_lock);
2494 	partid_max_published = true;
2495 	spin_unlock(&partid_max_lock);
2496 
2497 	/*
2498 	 * If all the MSC have been probed, enabling the IRQs happens next.
2499 	 * That involves cross-calling to a CPU that can reach the MSC, and
2500 	 * the locks must be taken in this order:
2501 	 */
2502 	cpus_read_lock();
2503 	mutex_lock(&mpam_list_lock);
2504 	do {
2505 		mpam_enable_merge_features(&mpam_classes);
2506 
2507 		err = mpam_register_irqs();
2508 		if (err) {
2509 			pr_warn("Failed to register irqs: %d\n", err);
2510 			break;
2511 		}
2512 
2513 		err = mpam_allocate_config();
2514 		if (err) {
2515 			pr_err("Failed to allocate configuration arrays.\n");
2516 			break;
2517 		}
2518 	} while (0);
2519 	mutex_unlock(&mpam_list_lock);
2520 	cpus_read_unlock();
2521 
2522 	if (err) {
2523 		mpam_disable_reason = "failed to enable";
2524 		schedule_work(&mpam_broken_work);
2525 		return;
2526 	}
2527 
2528 	static_branch_enable(&mpam_enabled);
2529 	mpam_register_cpuhp_callbacks(mpam_cpu_online, mpam_cpu_offline,
2530 				      "mpam:online");
2531 
2532 	/* Use printk() to avoid the pr_fmt adding the function name. */
2533 	printk(KERN_INFO "MPAM enabled with %u PARTIDs and %u PMGs\n",
2534 	       mpam_partid_max + 1, mpam_pmg_max + 1);
2535 }
2536 
2537 static void mpam_reset_component_locked(struct mpam_component *comp)
2538 {
2539 	struct mpam_vmsc *vmsc;
2540 
2541 	lockdep_assert_cpus_held();
2542 	mpam_assert_partid_sizes_fixed();
2543 
2544 	mpam_reset_component_cfg(comp);
2545 
2546 	guard(srcu)(&mpam_srcu);
2547 	list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
2548 				 srcu_read_lock_held(&mpam_srcu)) {
2549 		struct mpam_msc *msc = vmsc->msc;
2550 		struct mpam_msc_ris *ris;
2551 
2552 		list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
2553 					 srcu_read_lock_held(&mpam_srcu)) {
2554 			if (!ris->in_reset_state)
2555 				mpam_touch_msc(msc, mpam_reset_ris, ris);
2556 			ris->in_reset_state = true;
2557 		}
2558 	}
2559 }
2560 
2561 static void mpam_reset_class_locked(struct mpam_class *class)
2562 {
2563 	struct mpam_component *comp;
2564 
2565 	lockdep_assert_cpus_held();
2566 
2567 	guard(srcu)(&mpam_srcu);
2568 	list_for_each_entry_srcu(comp, &class->components, class_list,
2569 				 srcu_read_lock_held(&mpam_srcu))
2570 		mpam_reset_component_locked(comp);
2571 }
2572 
2573 static void mpam_reset_class(struct mpam_class *class)
2574 {
2575 	cpus_read_lock();
2576 	mpam_reset_class_locked(class);
2577 	cpus_read_unlock();
2578 }
2579 
2580 /*
2581  * Called in response to an error IRQ.
2582  * All of MPAM's errors indicate a software bug; restore any modified
2583  * controls to their reset values.
2584  */
2585 void mpam_disable(struct work_struct *ignored)
2586 {
2587 	int idx;
2588 	struct mpam_class *class;
2589 	struct mpam_msc *msc, *tmp;
2590 
2591 	mutex_lock(&mpam_cpuhp_state_lock);
2592 	if (mpam_cpuhp_state) {
2593 		cpuhp_remove_state(mpam_cpuhp_state);
2594 		mpam_cpuhp_state = 0;
2595 	}
2596 	mutex_unlock(&mpam_cpuhp_state_lock);
2597 
2598 	static_branch_disable(&mpam_enabled);
2599 
2600 	mpam_unregister_irqs();
2601 
2602 	idx = srcu_read_lock(&mpam_srcu);
2603 	list_for_each_entry_srcu(class, &mpam_classes, classes_list,
2604 				 srcu_read_lock_held(&mpam_srcu))
2605 		mpam_reset_class(class);
2606 	srcu_read_unlock(&mpam_srcu, idx);
2607 
2608 	mutex_lock(&mpam_list_lock);
2609 	list_for_each_entry_safe(msc, tmp, &mpam_all_msc, all_msc_list)
2610 		mpam_msc_destroy(msc);
2611 	mutex_unlock(&mpam_list_lock);
2612 	mpam_free_garbage();
2613 
2614 	pr_err_once("MPAM disabled due to %s\n", mpam_disable_reason);
2615 }
2616 
2617 /*
2618  * Enable mpam once all devices have been probed.
2619  * Scheduled by mpam_discovery_cpu_online() once all devices have been created.
2620  * Also scheduled when new devices are probed as new CPUs come online.
2621  */
2622 void mpam_enable(struct work_struct *work)
2623 {
2624 	static atomic_t once;
2625 	struct mpam_msc *msc;
2626 	bool all_devices_probed = true;
2627 
2628 	/* Have we probed all the hw devices? */
2629 	guard(srcu)(&mpam_srcu);
2630 	list_for_each_entry_srcu(msc, &mpam_all_msc, all_msc_list,
2631 				 srcu_read_lock_held(&mpam_srcu)) {
2632 		mutex_lock(&msc->probe_lock);
2633 		if (!msc->probed)
2634 			all_devices_probed = false;
2635 		mutex_unlock(&msc->probe_lock);
2636 
2637 		if (!all_devices_probed)
2638 			break;
2639 	}
2640 
2641 	if (all_devices_probed && !atomic_fetch_inc(&once))
2642 		mpam_enable_once();
2643 }
2644 
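/*
 * Copy a single value from newcfg into the stored cfg when the caller set
 * that feature and the value differs, and note that something changed so
 * the hardware gets reprogrammed.
 */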
2645 #define maybe_update_config(cfg, feature, newcfg, member, changes) do { \
2646 	if (mpam_has_feature(feature, newcfg) &&			\
2647 	    (newcfg)->member != (cfg)->member) {			\
2648 		(cfg)->member = (newcfg)->member;			\
2649 		mpam_set_feature(feature, cfg);				\
2650 									\
2651 		(changes) = true;					\
2652 	}								\
2653 } while (0)
2654 
2655 static bool mpam_update_config(struct mpam_config *cfg,
2656 			       const struct mpam_config *newcfg)
2657 {
2658 	bool has_changes = false;
2659 
2660 	maybe_update_config(cfg, mpam_feat_cpor_part, newcfg, cpbm, has_changes);
2661 	maybe_update_config(cfg, mpam_feat_mbw_part, newcfg, mbw_pbm, has_changes);
2662 	maybe_update_config(cfg, mpam_feat_mbw_max, newcfg, mbw_max, has_changes);
2663 
2664 	return has_changes;
2665 }
2666 
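/*
 * Update the stored configuration for this partid and, only if something
 * changed, write it out to every RIS in the component via mpam_touch_msc(),
 * which cross-calls to a CPU that can reach each MSC.
 */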
2667 int mpam_apply_config(struct mpam_component *comp, u16 partid,
2668 		      struct mpam_config *cfg)
2669 {
2670 	struct mpam_write_config_arg arg;
2671 	struct mpam_msc_ris *ris;
2672 	struct mpam_vmsc *vmsc;
2673 	struct mpam_msc *msc;
2674 
2675 	lockdep_assert_cpus_held();
2676 
2677 	/* Don't pass in the current config! */
2678 	WARN_ON_ONCE(&comp->cfg[partid] == cfg);
2679 
2680 	if (!mpam_update_config(&comp->cfg[partid], cfg))
2681 		return 0;
2682 
2683 	arg.comp = comp;
2684 	arg.partid = partid;
2685 
2686 	guard(srcu)(&mpam_srcu);
2687 	list_for_each_entry_srcu(vmsc, &comp->vmsc, comp_list,
2688 				 srcu_read_lock_held(&mpam_srcu)) {
2689 		msc = vmsc->msc;
2690 
2691 		mutex_lock(&msc->cfg_lock);
2692 		list_for_each_entry_srcu(ris, &vmsc->ris, vmsc_list,
2693 					 srcu_read_lock_held(&mpam_srcu)) {
2694 			arg.ris = ris;
2695 			mpam_touch_msc(msc, __write_config, &arg);
2696 		}
2697 		mutex_unlock(&msc->cfg_lock);
2698 	}
2699 
2700 	return 0;
2701 }
2702 
2703 static int __init mpam_msc_driver_init(void)
2704 {
2705 	if (!system_supports_mpam())
2706 		return -EOPNOTSUPP;
2707 
2708 	init_srcu_struct(&mpam_srcu);
2709 
2710 	fw_num_msc = acpi_mpam_count_msc();
2711 	if (fw_num_msc <= 0) {
2712 		pr_err("No MSC devices found in firmware\n");
2713 		return -EINVAL;
2714 	}
2715 
2716 	return platform_driver_register(&mpam_msc_driver);
2717 }
2718 
2719 /* Must occur after arm64_mpam_register_cpus() from arch_initcall() */
2720 subsys_initcall(mpam_msc_driver_init);
2721 
2722 #ifdef CONFIG_MPAM_KUNIT_TEST
2723 #include "test_mpam_devices.c"
2724 #endif
2725