]>
Commit | Line | Data |
---|---|---|
b2441318 | 1 | // SPDX-License-Identifier: GPL-2.0 |
de0428a7 KW |
2 | #include <linux/perf_event.h> |
3 | #include <linux/types.h> | |
4 | ||
27f6d22b | 5 | #include "../perf_event.h" |
f22f54f4 PZ |
6 | |
7 | /* | |
8 | * Not sure about some of these | |
9 | */ | |
10 | static const u64 p6_perfmon_event_map[] = | |
11 | { | |
e09df478 VW |
12 | [PERF_COUNT_HW_CPU_CYCLES] = 0x0079, /* CPU_CLK_UNHALTED */ |
13 | [PERF_COUNT_HW_INSTRUCTIONS] = 0x00c0, /* INST_RETIRED */ | |
14 | [PERF_COUNT_HW_CACHE_REFERENCES] = 0x0f2e, /* L2_RQSTS:M:E:S:I */ | |
15 | [PERF_COUNT_HW_CACHE_MISSES] = 0x012e, /* L2_RQSTS:I */ | |
16 | [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = 0x00c4, /* BR_INST_RETIRED */ | |
17 | [PERF_COUNT_HW_BRANCH_MISSES] = 0x00c5, /* BR_MISS_PRED_RETIRED */ | |
18 | [PERF_COUNT_HW_BUS_CYCLES] = 0x0062, /* BUS_DRDY_CLOCKS */ | |
19 | [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = 0x00a2, /* RESOURCE_STALLS */ | |
20 | ||
21 | }; | |
22 | ||
c391c788 | 23 | static const u64 __initconst p6_hw_cache_event_ids |
e09df478 VW |
24 | [PERF_COUNT_HW_CACHE_MAX] |
25 | [PERF_COUNT_HW_CACHE_OP_MAX] | |
26 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = | |
27 | { | |
28 | [ C(L1D) ] = { | |
29 | [ C(OP_READ) ] = { | |
30 | [ C(RESULT_ACCESS) ] = 0x0043, /* DATA_MEM_REFS */ | |
31 | [ C(RESULT_MISS) ] = 0x0045, /* DCU_LINES_IN */ | |
32 | }, | |
33 | [ C(OP_WRITE) ] = { | |
34 | [ C(RESULT_ACCESS) ] = 0, | |
35 | [ C(RESULT_MISS) ] = 0x0f29, /* L2_LD:M:E:S:I */ | |
36 | }, | |
37 | [ C(OP_PREFETCH) ] = { | |
38 | [ C(RESULT_ACCESS) ] = 0, | |
39 | [ C(RESULT_MISS) ] = 0, | |
40 | }, | |
41 | }, | |
42 | [ C(L1I ) ] = { | |
43 | [ C(OP_READ) ] = { | |
44 | [ C(RESULT_ACCESS) ] = 0x0080, /* IFU_IFETCH */ | |
45 | [ C(RESULT_MISS) ] = 0x0f28, /* L2_IFETCH:M:E:S:I */ | |
46 | }, | |
47 | [ C(OP_WRITE) ] = { | |
48 | [ C(RESULT_ACCESS) ] = -1, | |
49 | [ C(RESULT_MISS) ] = -1, | |
50 | }, | |
51 | [ C(OP_PREFETCH) ] = { | |
52 | [ C(RESULT_ACCESS) ] = 0, | |
53 | [ C(RESULT_MISS) ] = 0, | |
54 | }, | |
55 | }, | |
56 | [ C(LL ) ] = { | |
57 | [ C(OP_READ) ] = { | |
58 | [ C(RESULT_ACCESS) ] = 0, | |
59 | [ C(RESULT_MISS) ] = 0, | |
60 | }, | |
61 | [ C(OP_WRITE) ] = { | |
62 | [ C(RESULT_ACCESS) ] = 0, | |
63 | [ C(RESULT_MISS) ] = 0x0025, /* L2_M_LINES_INM */ | |
64 | }, | |
65 | [ C(OP_PREFETCH) ] = { | |
66 | [ C(RESULT_ACCESS) ] = 0, | |
67 | [ C(RESULT_MISS) ] = 0, | |
68 | }, | |
69 | }, | |
70 | [ C(DTLB) ] = { | |
71 | [ C(OP_READ) ] = { | |
72 | [ C(RESULT_ACCESS) ] = 0x0043, /* DATA_MEM_REFS */ | |
73 | [ C(RESULT_MISS) ] = 0, | |
74 | }, | |
75 | [ C(OP_WRITE) ] = { | |
76 | [ C(RESULT_ACCESS) ] = 0, | |
77 | [ C(RESULT_MISS) ] = 0, | |
78 | }, | |
79 | [ C(OP_PREFETCH) ] = { | |
80 | [ C(RESULT_ACCESS) ] = 0, | |
81 | [ C(RESULT_MISS) ] = 0, | |
82 | }, | |
83 | }, | |
84 | [ C(ITLB) ] = { | |
85 | [ C(OP_READ) ] = { | |
86 | [ C(RESULT_ACCESS) ] = 0x0080, /* IFU_IFETCH */ | |
87 | [ C(RESULT_MISS) ] = 0x0085, /* ITLB_MISS */ | |
88 | }, | |
89 | [ C(OP_WRITE) ] = { | |
90 | [ C(RESULT_ACCESS) ] = -1, | |
91 | [ C(RESULT_MISS) ] = -1, | |
92 | }, | |
93 | [ C(OP_PREFETCH) ] = { | |
94 | [ C(RESULT_ACCESS) ] = -1, | |
95 | [ C(RESULT_MISS) ] = -1, | |
96 | }, | |
97 | }, | |
98 | [ C(BPU ) ] = { | |
99 | [ C(OP_READ) ] = { | |
100 | [ C(RESULT_ACCESS) ] = 0x00c4, /* BR_INST_RETIRED */ | |
101 | [ C(RESULT_MISS) ] = 0x00c5, /* BR_MISS_PRED_RETIRED */ | |
102 | }, | |
103 | [ C(OP_WRITE) ] = { | |
104 | [ C(RESULT_ACCESS) ] = -1, | |
105 | [ C(RESULT_MISS) ] = -1, | |
106 | }, | |
107 | [ C(OP_PREFETCH) ] = { | |
108 | [ C(RESULT_ACCESS) ] = -1, | |
109 | [ C(RESULT_MISS) ] = -1, | |
110 | }, | |
111 | }, | |
f22f54f4 PZ |
112 | }; |
113 | ||
114 | static u64 p6_pmu_event_map(int hw_event) | |
115 | { | |
116 | return p6_perfmon_event_map[hw_event]; | |
117 | } | |
118 | ||
/*
 * Event-select value that is specified not to count anything:
 * L2_RQSTS (event 0x2e) with an all-zero MESI unit mask.
 *
 * Programming it into a counter's event-select register is how this
 * driver effectively disables that counter.
 */
#define P6_NOP_EVENT			0x0000002EULL
126 | ||
f22f54f4 PZ |
127 | static struct event_constraint p6_event_constraints[] = |
128 | { | |
129 | INTEL_EVENT_CONSTRAINT(0xc1, 0x1), /* FLOPS */ | |
130 | INTEL_EVENT_CONSTRAINT(0x10, 0x1), /* FP_COMP_OPS_EXE */ | |
7991c9ca | 131 | INTEL_EVENT_CONSTRAINT(0x11, 0x2), /* FP_ASSIST */ |
f22f54f4 PZ |
132 | INTEL_EVENT_CONSTRAINT(0x12, 0x2), /* MUL */ |
133 | INTEL_EVENT_CONSTRAINT(0x13, 0x2), /* DIV */ | |
134 | INTEL_EVENT_CONSTRAINT(0x14, 0x1), /* CYCLES_DIV_BUSY */ | |
135 | EVENT_CONSTRAINT_END | |
136 | }; | |
137 | ||
138 | static void p6_pmu_disable_all(void) | |
139 | { | |
140 | u64 val; | |
141 | ||
142 | /* p6 only has one enable register */ | |
143 | rdmsrl(MSR_P6_EVNTSEL0, val); | |
bb1165d6 | 144 | val &= ~ARCH_PERFMON_EVENTSEL_ENABLE; |
f22f54f4 PZ |
145 | wrmsrl(MSR_P6_EVNTSEL0, val); |
146 | } | |
147 | ||
11164cd4 | 148 | static void p6_pmu_enable_all(int added) |
f22f54f4 PZ |
149 | { |
150 | unsigned long val; | |
151 | ||
152 | /* p6 only has one enable register */ | |
153 | rdmsrl(MSR_P6_EVNTSEL0, val); | |
bb1165d6 | 154 | val |= ARCH_PERFMON_EVENTSEL_ENABLE; |
f22f54f4 PZ |
155 | wrmsrl(MSR_P6_EVNTSEL0, val); |
156 | } | |
157 | ||
158 | static inline void | |
aff3d91a | 159 | p6_pmu_disable_event(struct perf_event *event) |
f22f54f4 | 160 | { |
aff3d91a | 161 | struct hw_perf_event *hwc = &event->hw; |
f22f54f4 PZ |
162 | u64 val = P6_NOP_EVENT; |
163 | ||
715c85b1 | 164 | (void)wrmsrl_safe(hwc->config_base, val); |
f22f54f4 PZ |
165 | } |
166 | ||
aff3d91a | 167 | static void p6_pmu_enable_event(struct perf_event *event) |
f22f54f4 | 168 | { |
aff3d91a | 169 | struct hw_perf_event *hwc = &event->hw; |
f22f54f4 PZ |
170 | u64 val; |
171 | ||
172 | val = hwc->config; | |
58e9eaf0 VW |
173 | |
174 | /* | |
175 | * p6 only has a global event enable, set on PerfEvtSel0 | |
176 | * We "disable" events by programming P6_NOP_EVENT | |
177 | * and we rely on p6_pmu_enable_all() being called | |
178 | * to actually enable the events. | |
179 | */ | |
f22f54f4 | 180 | |
715c85b1 | 181 | (void)wrmsrl_safe(hwc->config_base, val); |
f22f54f4 PZ |
182 | } |
183 | ||
641cc938 JO |
184 | PMU_FORMAT_ATTR(event, "config:0-7" ); |
185 | PMU_FORMAT_ATTR(umask, "config:8-15" ); | |
186 | PMU_FORMAT_ATTR(edge, "config:18" ); | |
187 | PMU_FORMAT_ATTR(pc, "config:19" ); | |
188 | PMU_FORMAT_ATTR(inv, "config:23" ); | |
189 | PMU_FORMAT_ATTR(cmask, "config:24-31" ); | |
190 | ||
191 | static struct attribute *intel_p6_formats_attr[] = { | |
192 | &format_attr_event.attr, | |
193 | &format_attr_umask.attr, | |
194 | &format_attr_edge.attr, | |
195 | &format_attr_pc.attr, | |
196 | &format_attr_inv.attr, | |
197 | &format_attr_cmask.attr, | |
198 | NULL, | |
199 | }; | |
200 | ||
caaa8be3 | 201 | static __initconst const struct x86_pmu p6_pmu = { |
f22f54f4 PZ |
202 | .name = "p6", |
203 | .handle_irq = x86_pmu_handle_irq, | |
204 | .disable_all = p6_pmu_disable_all, | |
205 | .enable_all = p6_pmu_enable_all, | |
206 | .enable = p6_pmu_enable_event, | |
207 | .disable = p6_pmu_disable_event, | |
b4cdc5c2 | 208 | .hw_config = x86_pmu_hw_config, |
a072738e | 209 | .schedule_events = x86_schedule_events, |
f22f54f4 PZ |
210 | .eventsel = MSR_P6_EVNTSEL0, |
211 | .perfctr = MSR_P6_PERFCTR0, | |
212 | .event_map = p6_pmu_event_map, | |
f22f54f4 PZ |
213 | .max_events = ARRAY_SIZE(p6_perfmon_event_map), |
214 | .apic = 1, | |
215 | .max_period = (1ULL << 31) - 1, | |
216 | .version = 0, | |
948b1bb8 | 217 | .num_counters = 2, |
f22f54f4 PZ |
218 | /* |
219 | * Events have 40 bits implemented. However they are designed such | |
220 | * that bits [32-39] are sign extensions of bit 31. As such the | |
221 | * effective width of a event for P6-like PMU is 32 bits only. | |
222 | * | |
223 | * See IA-32 Intel Architecture Software developer manual Vol 3B | |
224 | */ | |
948b1bb8 RR |
225 | .cntval_bits = 32, |
226 | .cntval_mask = (1ULL << 32) - 1, | |
f22f54f4 PZ |
227 | .get_event_constraints = x86_get_event_constraints, |
228 | .event_constraints = p6_event_constraints, | |
641cc938 JO |
229 | |
230 | .format_attrs = intel_p6_formats_attr, | |
20550a43 JO |
231 | .events_sysfs_show = intel_event_sysfs_show, |
232 | ||
f22f54f4 PZ |
233 | }; |
234 | ||
e97df763 PZ |
235 | static __init void p6_pmu_rdpmc_quirk(void) |
236 | { | |
237 | if (boot_cpu_data.x86_mask < 9) { | |
238 | /* | |
239 | * PPro erratum 26; fixed in stepping 9 and above. | |
240 | */ | |
241 | pr_warn("Userspace RDPMC support disabled due to a CPU erratum\n"); | |
242 | x86_pmu.attr_rdpmc_broken = 1; | |
243 | x86_pmu.attr_rdpmc = 0; | |
244 | } | |
245 | } | |
246 | ||
de0428a7 | 247 | __init int p6_pmu_init(void) |
f22f54f4 | 248 | { |
e97df763 PZ |
249 | x86_pmu = p6_pmu; |
250 | ||
f22f54f4 | 251 | switch (boot_cpu_data.x86_model) { |
e97df763 PZ |
252 | case 1: /* Pentium Pro */ |
253 | x86_add_quirk(p6_pmu_rdpmc_quirk); | |
254 | break; | |
255 | ||
256 | case 3: /* Pentium II - Klamath */ | |
257 | case 5: /* Pentium II - Deschutes */ | |
258 | case 6: /* Pentium II - Mendocino */ | |
f22f54f4 | 259 | break; |
e97df763 PZ |
260 | |
261 | case 7: /* Pentium III - Katmai */ | |
262 | case 8: /* Pentium III - Coppermine */ | |
263 | case 10: /* Pentium III Xeon */ | |
264 | case 11: /* Pentium III - Tualatin */ | |
265 | break; | |
266 | ||
267 | case 9: /* Pentium M - Banias */ | |
268 | case 13: /* Pentium M - Dothan */ | |
269 | break; | |
270 | ||
f22f54f4 | 271 | default: |
e97df763 | 272 | pr_cont("unsupported p6 CPU model %d ", boot_cpu_data.x86_model); |
f22f54f4 PZ |
273 | return -ENODEV; |
274 | } | |
275 | ||
e09df478 VW |
276 | memcpy(hw_cache_event_ids, p6_hw_cache_event_ids, |
277 | sizeof(hw_cache_event_ids)); | |
278 | ||
f22f54f4 PZ |
279 | return 0; |
280 | } |