xref: /linux/arch/x86/events/intel/p6.c (revision c8bfe3fad4f86a029da7157bae9699c816f0c309)
1 // SPDX-License-Identifier: GPL-2.0
2 #include <linux/perf_event.h>
3 #include <linux/types.h>
4 
5 #include "../perf_event.h"
6 
7 /*
8  * Not sure about some of these
9  */
10 static const u64 p6_perfmon_event_map[] =
11 {
12   [PERF_COUNT_HW_CPU_CYCLES]		= 0x0079,	/* CPU_CLK_UNHALTED */
13   [PERF_COUNT_HW_INSTRUCTIONS]		= 0x00c0,	/* INST_RETIRED     */
14   [PERF_COUNT_HW_CACHE_REFERENCES]	= 0x0f2e,	/* L2_RQSTS:M:E:S:I */
15   [PERF_COUNT_HW_CACHE_MISSES]		= 0x012e,	/* L2_RQSTS:I       */
16   [PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= 0x00c4,	/* BR_INST_RETIRED  */
17   [PERF_COUNT_HW_BRANCH_MISSES]		= 0x00c5,	/* BR_MISS_PRED_RETIRED */
18   [PERF_COUNT_HW_BUS_CYCLES]		= 0x0062,	/* BUS_DRDY_CLOCKS  */
19   [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = 0x00a2,	/* RESOURCE_STALLS  */
20 
21 };
22 
23 static const u64 __initconst p6_hw_cache_event_ids
24 				[PERF_COUNT_HW_CACHE_MAX]
25 				[PERF_COUNT_HW_CACHE_OP_MAX]
26 				[PERF_COUNT_HW_CACHE_RESULT_MAX] =
27 {
28  [ C(L1D) ] = {
29 	[ C(OP_READ) ] = {
30 		[ C(RESULT_ACCESS) ] = 0x0043,	/* DATA_MEM_REFS       */
31                 [ C(RESULT_MISS)   ] = 0x0045,	/* DCU_LINES_IN        */
32 	},
33 	[ C(OP_WRITE) ] = {
34 		[ C(RESULT_ACCESS) ] = 0,
35 		[ C(RESULT_MISS)   ] = 0x0f29,	/* L2_LD:M:E:S:I       */
36 	},
37         [ C(OP_PREFETCH) ] = {
38 		[ C(RESULT_ACCESS) ] = 0,
39 		[ C(RESULT_MISS)   ] = 0,
40         },
41  },
42  [ C(L1I ) ] = {
43 	[ C(OP_READ) ] = {
44 		[ C(RESULT_ACCESS) ] = 0x0080,	/* IFU_IFETCH         */
45 		[ C(RESULT_MISS)   ] = 0x0f28,	/* L2_IFETCH:M:E:S:I  */
46 	},
47 	[ C(OP_WRITE) ] = {
48 		[ C(RESULT_ACCESS) ] = -1,
49 		[ C(RESULT_MISS)   ] = -1,
50 	},
51 	[ C(OP_PREFETCH) ] = {
52 		[ C(RESULT_ACCESS) ] = 0,
53 		[ C(RESULT_MISS)   ] = 0,
54 	},
55  },
56  [ C(LL  ) ] = {
57 	[ C(OP_READ) ] = {
58 		[ C(RESULT_ACCESS) ] = 0,
59 		[ C(RESULT_MISS)   ] = 0,
60 	},
61 	[ C(OP_WRITE) ] = {
62 		[ C(RESULT_ACCESS) ] = 0,
63 		[ C(RESULT_MISS)   ] = 0x0025,	/* L2_M_LINES_INM     */
64 	},
65 	[ C(OP_PREFETCH) ] = {
66 		[ C(RESULT_ACCESS) ] = 0,
67 		[ C(RESULT_MISS)   ] = 0,
68 	},
69  },
70  [ C(DTLB) ] = {
71 	[ C(OP_READ) ] = {
72 		[ C(RESULT_ACCESS) ] = 0x0043,	/* DATA_MEM_REFS      */
73 		[ C(RESULT_MISS)   ] = 0,
74 	},
75 	[ C(OP_WRITE) ] = {
76 		[ C(RESULT_ACCESS) ] = 0,
77 		[ C(RESULT_MISS)   ] = 0,
78 	},
79 	[ C(OP_PREFETCH) ] = {
80 		[ C(RESULT_ACCESS) ] = 0,
81 		[ C(RESULT_MISS)   ] = 0,
82 	},
83  },
84  [ C(ITLB) ] = {
85 	[ C(OP_READ) ] = {
86 		[ C(RESULT_ACCESS) ] = 0x0080,	/* IFU_IFETCH         */
87 		[ C(RESULT_MISS)   ] = 0x0085,	/* ITLB_MISS          */
88 	},
89 	[ C(OP_WRITE) ] = {
90 		[ C(RESULT_ACCESS) ] = -1,
91 		[ C(RESULT_MISS)   ] = -1,
92 	},
93 	[ C(OP_PREFETCH) ] = {
94 		[ C(RESULT_ACCESS) ] = -1,
95 		[ C(RESULT_MISS)   ] = -1,
96 	},
97  },
98  [ C(BPU ) ] = {
99 	[ C(OP_READ) ] = {
100 		[ C(RESULT_ACCESS) ] = 0x00c4,	/* BR_INST_RETIRED      */
101 		[ C(RESULT_MISS)   ] = 0x00c5,	/* BR_MISS_PRED_RETIRED */
102         },
103 	[ C(OP_WRITE) ] = {
104 		[ C(RESULT_ACCESS) ] = -1,
105 		[ C(RESULT_MISS)   ] = -1,
106 	},
107 	[ C(OP_PREFETCH) ] = {
108 		[ C(RESULT_ACCESS) ] = -1,
109 		[ C(RESULT_MISS)   ] = -1,
110 	},
111  },
112 };
113 
114 static u64 p6_pmu_event_map(int hw_event)
115 {
116 	return p6_perfmon_event_map[hw_event];
117 }
118 
119 /*
120  * Event setting that is specified not to count anything.
121  * We use this to effectively disable a counter.
122  *
123  * L2_RQSTS with 0 MESI unit mask.
124  */
125 #define P6_NOP_EVENT			0x0000002EULL
126 
127 static struct event_constraint p6_event_constraints[] =
128 {
129 	INTEL_EVENT_CONSTRAINT(0xc1, 0x1),	/* FLOPS */
130 	INTEL_EVENT_CONSTRAINT(0x10, 0x1),	/* FP_COMP_OPS_EXE */
131 	INTEL_EVENT_CONSTRAINT(0x11, 0x2),	/* FP_ASSIST */
132 	INTEL_EVENT_CONSTRAINT(0x12, 0x2),	/* MUL */
133 	INTEL_EVENT_CONSTRAINT(0x13, 0x2),	/* DIV */
134 	INTEL_EVENT_CONSTRAINT(0x14, 0x1),	/* CYCLES_DIV_BUSY */
135 	EVENT_CONSTRAINT_END
136 };
137 
138 static void p6_pmu_disable_all(void)
139 {
140 	u64 val;
141 
142 	/* p6 only has one enable register */
143 	rdmsrl(MSR_P6_EVNTSEL0, val);
144 	val &= ~ARCH_PERFMON_EVENTSEL_ENABLE;
145 	wrmsrl(MSR_P6_EVNTSEL0, val);
146 }
147 
148 static void p6_pmu_enable_all(int added)
149 {
150 	unsigned long val;
151 
152 	/* p6 only has one enable register */
153 	rdmsrl(MSR_P6_EVNTSEL0, val);
154 	val |= ARCH_PERFMON_EVENTSEL_ENABLE;
155 	wrmsrl(MSR_P6_EVNTSEL0, val);
156 }
157 
158 static inline void
159 p6_pmu_disable_event(struct perf_event *event)
160 {
161 	struct hw_perf_event *hwc = &event->hw;
162 	u64 val = P6_NOP_EVENT;
163 
164 	(void)wrmsrl_safe(hwc->config_base, val);
165 }
166 
167 static void p6_pmu_enable_event(struct perf_event *event)
168 {
169 	struct hw_perf_event *hwc = &event->hw;
170 	u64 val;
171 
172 	val = hwc->config;
173 
174 	/*
175 	 * p6 only has a global event enable, set on PerfEvtSel0
176 	 * We "disable" events by programming P6_NOP_EVENT
177 	 * and we rely on p6_pmu_enable_all() being called
178 	 * to actually enable the events.
179 	 */
180 
181 	(void)wrmsrl_safe(hwc->config_base, val);
182 }
183 
184 PMU_FORMAT_ATTR(event,	"config:0-7"	);
185 PMU_FORMAT_ATTR(umask,	"config:8-15"	);
186 PMU_FORMAT_ATTR(edge,	"config:18"	);
187 PMU_FORMAT_ATTR(pc,	"config:19"	);
188 PMU_FORMAT_ATTR(inv,	"config:23"	);
189 PMU_FORMAT_ATTR(cmask,	"config:24-31"	);
190 
191 static struct attribute *intel_p6_formats_attr[] = {
192 	&format_attr_event.attr,
193 	&format_attr_umask.attr,
194 	&format_attr_edge.attr,
195 	&format_attr_pc.attr,
196 	&format_attr_inv.attr,
197 	&format_attr_cmask.attr,
198 	NULL,
199 };
200 
201 static __initconst const struct x86_pmu p6_pmu = {
202 	.name			= "p6",
203 	.handle_irq		= x86_pmu_handle_irq,
204 	.disable_all		= p6_pmu_disable_all,
205 	.enable_all		= p6_pmu_enable_all,
206 	.enable			= p6_pmu_enable_event,
207 	.disable		= p6_pmu_disable_event,
208 	.hw_config		= x86_pmu_hw_config,
209 	.schedule_events	= x86_schedule_events,
210 	.eventsel		= MSR_P6_EVNTSEL0,
211 	.perfctr		= MSR_P6_PERFCTR0,
212 	.event_map		= p6_pmu_event_map,
213 	.max_events		= ARRAY_SIZE(p6_perfmon_event_map),
214 	.apic			= 1,
215 	.max_period		= (1ULL << 31) - 1,
216 	.version		= 0,
217 	.num_counters		= 2,
218 	/*
219 	 * Events have 40 bits implemented. However they are designed such
220 	 * that bits [32-39] are sign extensions of bit 31. As such the
221 	 * effective width of a event for P6-like PMU is 32 bits only.
222 	 *
223 	 * See IA-32 Intel Architecture Software developer manual Vol 3B
224 	 */
225 	.cntval_bits		= 32,
226 	.cntval_mask		= (1ULL << 32) - 1,
227 	.get_event_constraints	= x86_get_event_constraints,
228 	.event_constraints	= p6_event_constraints,
229 
230 	.format_attrs		= intel_p6_formats_attr,
231 	.events_sysfs_show	= intel_event_sysfs_show,
232 
233 };
234 
235 static __init void p6_pmu_rdpmc_quirk(void)
236 {
237 	if (boot_cpu_data.x86_stepping < 9) {
238 		/*
239 		 * PPro erratum 26; fixed in stepping 9 and above.
240 		 */
241 		pr_warn("Userspace RDPMC support disabled due to a CPU erratum\n");
242 		x86_pmu.attr_rdpmc_broken = 1;
243 		x86_pmu.attr_rdpmc = 0;
244 	}
245 }
246 
247 __init int p6_pmu_init(void)
248 {
249 	x86_pmu = p6_pmu;
250 
251 	switch (boot_cpu_data.x86_model) {
252 	case  1: /* Pentium Pro */
253 		x86_add_quirk(p6_pmu_rdpmc_quirk);
254 		break;
255 
256 	case  3: /* Pentium II - Klamath */
257 	case  5: /* Pentium II - Deschutes */
258 	case  6: /* Pentium II - Mendocino */
259 		break;
260 
261 	case  7: /* Pentium III - Katmai */
262 	case  8: /* Pentium III - Coppermine */
263 	case 10: /* Pentium III Xeon */
264 	case 11: /* Pentium III - Tualatin */
265 		break;
266 
267 	case  9: /* Pentium M - Banias */
268 	case 13: /* Pentium M - Dothan */
269 		break;
270 
271 	default:
272 		pr_cont("unsupported p6 CPU model %d ", boot_cpu_data.x86_model);
273 		return -ENODEV;
274 	}
275 
276 	memcpy(hw_cache_event_ids, p6_hw_cache_event_ids,
277 		sizeof(hw_cache_event_ids));
278 
279 	return 0;
280 }
281