1 // SPDX-License-Identifier: GPL-2.0
3 * ARMv7 Cortex-A8 and Cortex-A9 Performance Events handling code.
5 * ARMv7 support: Jean Pihet <jpihet@mvista.com>
6 * 2010 (c) MontaVista Software, LLC.
8 * Copied from ARMv6 code, with the low level code inspired
9 * by the ARMv7 Oprofile code.
11 * Cortex-A8 has up to 4 configurable performance counters and
12 * a single cycle counter.
13 * Cortex-A9 has up to 31 configurable performance counters and
14 * a single cycle counter.
16 * All counters can be enabled/disabled and IRQ masked separately. The cycle
17 * counter and all 4 performance counters together can be reset separately.
23 #include <asm/cputype.h>
24 #include <asm/irq_regs.h>
26 #include "../vfp/vfpinstr.h"
29 #include <linux/perf/arm_pmu.h>
30 #include <linux/platform_device.h>
33 * Common ARMv7 event types
35 * Note: An implementation may not be able to count all of these events
36 * but the encodings are considered to be `reserved' in the case that
37 * they are not available.
39 #define ARMV7_PERFCTR_PMNC_SW_INCR 0x00
40 #define ARMV7_PERFCTR_L1_ICACHE_REFILL 0x01
41 #define ARMV7_PERFCTR_ITLB_REFILL 0x02
42 #define ARMV7_PERFCTR_L1_DCACHE_REFILL 0x03
43 #define ARMV7_PERFCTR_L1_DCACHE_ACCESS 0x04
44 #define ARMV7_PERFCTR_DTLB_REFILL 0x05
45 #define ARMV7_PERFCTR_MEM_READ 0x06
46 #define ARMV7_PERFCTR_MEM_WRITE 0x07
47 #define ARMV7_PERFCTR_INSTR_EXECUTED 0x08
48 #define ARMV7_PERFCTR_EXC_TAKEN 0x09
49 #define ARMV7_PERFCTR_EXC_EXECUTED 0x0A
50 #define ARMV7_PERFCTR_CID_WRITE 0x0B
53 * ARMV7_PERFCTR_PC_WRITE is equivalent to HW_BRANCH_INSTRUCTIONS.
55 * - all (taken) branch instructions,
56 * - instructions that explicitly write the PC,
57 * - exception generating instructions.
59 #define ARMV7_PERFCTR_PC_WRITE 0x0C
60 #define ARMV7_PERFCTR_PC_IMM_BRANCH 0x0D
61 #define ARMV7_PERFCTR_PC_PROC_RETURN 0x0E
62 #define ARMV7_PERFCTR_MEM_UNALIGNED_ACCESS 0x0F
63 #define ARMV7_PERFCTR_PC_BRANCH_MIS_PRED 0x10
64 #define ARMV7_PERFCTR_CLOCK_CYCLES 0x11
65 #define ARMV7_PERFCTR_PC_BRANCH_PRED 0x12
67 /* These events are defined by the PMUv2 supplement (ARM DDI 0457A). */
68 #define ARMV7_PERFCTR_MEM_ACCESS 0x13
69 #define ARMV7_PERFCTR_L1_ICACHE_ACCESS 0x14
70 #define ARMV7_PERFCTR_L1_DCACHE_WB 0x15
71 #define ARMV7_PERFCTR_L2_CACHE_ACCESS 0x16
72 #define ARMV7_PERFCTR_L2_CACHE_REFILL 0x17
73 #define ARMV7_PERFCTR_L2_CACHE_WB 0x18
74 #define ARMV7_PERFCTR_BUS_ACCESS 0x19
75 #define ARMV7_PERFCTR_MEM_ERROR 0x1A
76 #define ARMV7_PERFCTR_INSTR_SPEC 0x1B
77 #define ARMV7_PERFCTR_TTBR_WRITE 0x1C
78 #define ARMV7_PERFCTR_BUS_CYCLES 0x1D
80 #define ARMV7_PERFCTR_CPU_CYCLES 0xFF
82 /* ARMv7 Cortex-A8 specific event types */
83 #define ARMV7_A8_PERFCTR_L2_CACHE_ACCESS 0x43
84 #define ARMV7_A8_PERFCTR_L2_CACHE_REFILL 0x44
85 #define ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS 0x50
86 #define ARMV7_A8_PERFCTR_STALL_ISIDE 0x56
88 /* ARMv7 Cortex-A9 specific event types */
89 #define ARMV7_A9_PERFCTR_INSTR_CORE_RENAME 0x68
90 #define ARMV7_A9_PERFCTR_STALL_ICACHE 0x60
91 #define ARMV7_A9_PERFCTR_STALL_DISPATCH 0x66
93 /* ARMv7 Cortex-A5 specific event types */
94 #define ARMV7_A5_PERFCTR_PREFETCH_LINEFILL 0xc2
95 #define ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP 0xc3
97 /* ARMv7 Cortex-A15 specific event types */
98 #define ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ 0x40
99 #define ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE 0x41
100 #define ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ 0x42
101 #define ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE 0x43
103 #define ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ 0x4C
104 #define ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE 0x4D
106 #define ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ 0x50
107 #define ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE 0x51
108 #define ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ 0x52
109 #define ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE 0x53
111 #define ARMV7_A15_PERFCTR_PC_WRITE_SPEC 0x76
113 /* ARMv7 Cortex-A12 specific event types */
114 #define ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_READ 0x40
115 #define ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_WRITE 0x41
117 #define ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_READ 0x50
118 #define ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_WRITE 0x51
120 #define ARMV7_A12_PERFCTR_PC_WRITE_SPEC 0x76
122 #define ARMV7_A12_PERFCTR_PF_TLB_REFILL 0xe7
124 /* ARMv7 Krait specific event types */
125 #define KRAIT_PMRESR0_GROUP0 0xcc
126 #define KRAIT_PMRESR1_GROUP0 0xd0
127 #define KRAIT_PMRESR2_GROUP0 0xd4
128 #define KRAIT_VPMRESR0_GROUP0 0xd8
130 #define KRAIT_PERFCTR_L1_ICACHE_ACCESS 0x10011
131 #define KRAIT_PERFCTR_L1_ICACHE_MISS 0x10010
133 #define KRAIT_PERFCTR_L1_ITLB_ACCESS 0x12222
134 #define KRAIT_PERFCTR_L1_DTLB_ACCESS 0x12210
136 /* ARMv7 Scorpion specific event types */
137 #define SCORPION_LPM0_GROUP0 0x4c
138 #define SCORPION_LPM1_GROUP0 0x50
139 #define SCORPION_LPM2_GROUP0 0x54
140 #define SCORPION_L2LPM_GROUP0 0x58
141 #define SCORPION_VLPM_GROUP0 0x5c
143 #define SCORPION_ICACHE_ACCESS 0x10053
144 #define SCORPION_ICACHE_MISS 0x10052
146 #define SCORPION_DTLB_ACCESS 0x12013
147 #define SCORPION_DTLB_MISS 0x12012
149 #define SCORPION_ITLB_MISS 0x12021
152 * Cortex-A8 HW events mapping
154 * The hardware events that we support. We do support cache operations but
155 * we have harvard caches and no way to combine instruction and data
156 * accesses/misses in hardware.
158 static const unsigned armv7_a8_perf_map[PERF_COUNT_HW_MAX] = {
159 PERF_MAP_ALL_UNSUPPORTED,
160 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
161 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
162 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
163 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
164 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
165 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
166 [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = ARMV7_A8_PERFCTR_STALL_ISIDE,
169 static const unsigned armv7_a8_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
170 [PERF_COUNT_HW_CACHE_OP_MAX]
171 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
172 PERF_CACHE_MAP_ALL_UNSUPPORTED,
175 * The performance counters don't differentiate between read and write
176 * accesses/misses so this isn't strictly correct, but it's the best we
177 * can do. Writes and reads get combined.
179 [C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
180 [C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
181 [C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
182 [C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
184 [C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS,
185 [C(L1I)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
187 [C(LL)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
188 [C(LL)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
189 [C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
190 [C(LL)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
192 [C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
193 [C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
195 [C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
196 [C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
198 [C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
199 [C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
200 [C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
201 [C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
205 * Cortex-A9 HW events mapping
207 static const unsigned armv7_a9_perf_map[PERF_COUNT_HW_MAX] = {
208 PERF_MAP_ALL_UNSUPPORTED,
209 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
210 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_A9_PERFCTR_INSTR_CORE_RENAME,
211 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
212 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
213 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
214 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
215 [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = ARMV7_A9_PERFCTR_STALL_ICACHE,
216 [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = ARMV7_A9_PERFCTR_STALL_DISPATCH,
219 static const unsigned armv7_a9_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
220 [PERF_COUNT_HW_CACHE_OP_MAX]
221 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
222 PERF_CACHE_MAP_ALL_UNSUPPORTED,
225 * The performance counters don't differentiate between read and write
226 * accesses/misses so this isn't strictly correct, but it's the best we
227 * can do. Writes and reads get combined.
229 [C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
230 [C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
231 [C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
232 [C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
234 [C(L1I)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
236 [C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
237 [C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
239 [C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
240 [C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
242 [C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
243 [C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
244 [C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
245 [C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
249 * Cortex-A5 HW events mapping
251 static const unsigned armv7_a5_perf_map[PERF_COUNT_HW_MAX] = {
252 PERF_MAP_ALL_UNSUPPORTED,
253 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
254 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
255 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
256 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
257 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
258 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
261 static const unsigned armv7_a5_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
262 [PERF_COUNT_HW_CACHE_OP_MAX]
263 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
264 PERF_CACHE_MAP_ALL_UNSUPPORTED,
266 [C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
267 [C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
268 [C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
269 [C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
270 [C(L1D)][C(OP_PREFETCH)][C(RESULT_ACCESS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
271 [C(L1D)][C(OP_PREFETCH)][C(RESULT_MISS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
273 [C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
274 [C(L1I)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
276 * The prefetch counters don't differentiate between the I side and the
279 [C(L1I)][C(OP_PREFETCH)][C(RESULT_ACCESS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
280 [C(L1I)][C(OP_PREFETCH)][C(RESULT_MISS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
282 [C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
283 [C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
285 [C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
286 [C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
288 [C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
289 [C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
290 [C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
291 [C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
295 * Cortex-A15 HW events mapping
297 static const unsigned armv7_a15_perf_map[PERF_COUNT_HW_MAX] = {
298 PERF_MAP_ALL_UNSUPPORTED,
299 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
300 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
301 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
302 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
303 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_A15_PERFCTR_PC_WRITE_SPEC,
304 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
305 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_BUS_CYCLES,
308 static const unsigned armv7_a15_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
309 [PERF_COUNT_HW_CACHE_OP_MAX]
310 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
311 PERF_CACHE_MAP_ALL_UNSUPPORTED,
313 [C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ,
314 [C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ,
315 [C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE,
316 [C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE,
319 * Not all performance counters differentiate between read and write
320 * accesses/misses so we're not always strictly correct, but it's the
321 * best we can do. Writes and reads get combined in these cases.
323 [C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
324 [C(L1I)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
326 [C(LL)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ,
327 [C(LL)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ,
328 [C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE,
329 [C(LL)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE,
331 [C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ,
332 [C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE,
334 [C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
335 [C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
337 [C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
338 [C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
339 [C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
340 [C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
344 * Cortex-A7 HW events mapping
346 static const unsigned armv7_a7_perf_map[PERF_COUNT_HW_MAX] = {
347 PERF_MAP_ALL_UNSUPPORTED,
348 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
349 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
350 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
351 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
352 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
353 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
354 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_BUS_CYCLES,
357 static const unsigned armv7_a7_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
358 [PERF_COUNT_HW_CACHE_OP_MAX]
359 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
360 PERF_CACHE_MAP_ALL_UNSUPPORTED,
363 * The performance counters don't differentiate between read and write
364 * accesses/misses so this isn't strictly correct, but it's the best we
365 * can do. Writes and reads get combined.
367 [C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
368 [C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
369 [C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
370 [C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
372 [C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
373 [C(L1I)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
375 [C(LL)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L2_CACHE_ACCESS,
376 [C(LL)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L2_CACHE_REFILL,
377 [C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L2_CACHE_ACCESS,
378 [C(LL)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L2_CACHE_REFILL,
380 [C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
381 [C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
383 [C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
384 [C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
386 [C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
387 [C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
388 [C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
389 [C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
393 * Cortex-A12 HW events mapping
395 static const unsigned armv7_a12_perf_map[PERF_COUNT_HW_MAX] = {
396 PERF_MAP_ALL_UNSUPPORTED,
397 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
398 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
399 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
400 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
401 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_A12_PERFCTR_PC_WRITE_SPEC,
402 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
403 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_BUS_CYCLES,
406 static const unsigned armv7_a12_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
407 [PERF_COUNT_HW_CACHE_OP_MAX]
408 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
409 PERF_CACHE_MAP_ALL_UNSUPPORTED,
411 [C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_READ,
412 [C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
413 [C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_WRITE,
414 [C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
417 * Not all performance counters differentiate between read and write
418 * accesses/misses so we're not always strictly correct, but it's the
419 * best we can do. Writes and reads get combined in these cases.
421 [C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
422 [C(L1I)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
424 [C(LL)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_READ,
425 [C(LL)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L2_CACHE_REFILL,
426 [C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_WRITE,
427 [C(LL)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L2_CACHE_REFILL,
429 [C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
430 [C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
431 [C(DTLB)][C(OP_PREFETCH)][C(RESULT_MISS)] = ARMV7_A12_PERFCTR_PF_TLB_REFILL,
433 [C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
434 [C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
436 [C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
437 [C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
438 [C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
439 [C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
443 * Krait HW events mapping
445 static const unsigned krait_perf_map[PERF_COUNT_HW_MAX] = {
446 PERF_MAP_ALL_UNSUPPORTED,
447 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
448 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
449 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
450 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
451 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_CLOCK_CYCLES,
454 static const unsigned krait_perf_map_no_branch[PERF_COUNT_HW_MAX] = {
455 PERF_MAP_ALL_UNSUPPORTED,
456 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
457 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
458 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
459 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_CLOCK_CYCLES,
462 static const unsigned krait_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
463 [PERF_COUNT_HW_CACHE_OP_MAX]
464 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
465 PERF_CACHE_MAP_ALL_UNSUPPORTED,
468 * The performance counters don't differentiate between read and write
469 * accesses/misses so this isn't strictly correct, but it's the best we
470 * can do. Writes and reads get combined.
472 [C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
473 [C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
474 [C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
475 [C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
477 [C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = KRAIT_PERFCTR_L1_ICACHE_ACCESS,
478 [C(L1I)][C(OP_READ)][C(RESULT_MISS)] = KRAIT_PERFCTR_L1_ICACHE_MISS,
480 [C(DTLB)][C(OP_READ)][C(RESULT_ACCESS)] = KRAIT_PERFCTR_L1_DTLB_ACCESS,
481 [C(DTLB)][C(OP_WRITE)][C(RESULT_ACCESS)] = KRAIT_PERFCTR_L1_DTLB_ACCESS,
483 [C(ITLB)][C(OP_READ)][C(RESULT_ACCESS)] = KRAIT_PERFCTR_L1_ITLB_ACCESS,
484 [C(ITLB)][C(OP_WRITE)][C(RESULT_ACCESS)] = KRAIT_PERFCTR_L1_ITLB_ACCESS,
486 [C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
487 [C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
488 [C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
489 [C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
493 * Scorpion HW events mapping
495 static const unsigned scorpion_perf_map[PERF_COUNT_HW_MAX] = {
496 PERF_MAP_ALL_UNSUPPORTED,
497 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
498 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
499 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
500 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
501 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_CLOCK_CYCLES,
504 static const unsigned scorpion_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
505 [PERF_COUNT_HW_CACHE_OP_MAX]
506 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
507 PERF_CACHE_MAP_ALL_UNSUPPORTED,
509 * The performance counters don't differentiate between read and write
510 * accesses/misses so this isn't strictly correct, but it's the best we
511 * can do. Writes and reads get combined.
513 [C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
514 [C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
515 [C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
516 [C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
517 [C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = SCORPION_ICACHE_ACCESS,
518 [C(L1I)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_ICACHE_MISS,
520 * Only ITLB misses and DTLB refills are supported. If users want the
521 * DTLB refills misses a raw counter must be used.
523 [C(DTLB)][C(OP_READ)][C(RESULT_ACCESS)] = SCORPION_DTLB_ACCESS,
524 [C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_DTLB_MISS,
525 [C(DTLB)][C(OP_WRITE)][C(RESULT_ACCESS)] = SCORPION_DTLB_ACCESS,
526 [C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = SCORPION_DTLB_MISS,
527 [C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_ITLB_MISS,
528 [C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = SCORPION_ITLB_MISS,
529 [C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
530 [C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
531 [C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
532 [C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
535 PMU_FORMAT_ATTR(event, "config:0-7");
537 static struct attribute *armv7_pmu_format_attrs[] = {
538 &format_attr_event.attr,
542 static struct attribute_group armv7_pmu_format_attr_group = {
544 .attrs = armv7_pmu_format_attrs,
547 #define ARMV7_EVENT_ATTR_RESOLVE(m) #m
548 #define ARMV7_EVENT_ATTR(name, config) \
549 PMU_EVENT_ATTR_STRING(name, armv7_event_attr_##name, \
550 "event=" ARMV7_EVENT_ATTR_RESOLVE(config))
552 ARMV7_EVENT_ATTR(sw_incr, ARMV7_PERFCTR_PMNC_SW_INCR);
553 ARMV7_EVENT_ATTR(l1i_cache_refill, ARMV7_PERFCTR_L1_ICACHE_REFILL);
554 ARMV7_EVENT_ATTR(l1i_tlb_refill, ARMV7_PERFCTR_ITLB_REFILL);
555 ARMV7_EVENT_ATTR(l1d_cache_refill, ARMV7_PERFCTR_L1_DCACHE_REFILL);
556 ARMV7_EVENT_ATTR(l1d_cache, ARMV7_PERFCTR_L1_DCACHE_ACCESS);
557 ARMV7_EVENT_ATTR(l1d_tlb_refill, ARMV7_PERFCTR_DTLB_REFILL);
558 ARMV7_EVENT_ATTR(ld_retired, ARMV7_PERFCTR_MEM_READ);
559 ARMV7_EVENT_ATTR(st_retired, ARMV7_PERFCTR_MEM_WRITE);
560 ARMV7_EVENT_ATTR(inst_retired, ARMV7_PERFCTR_INSTR_EXECUTED);
561 ARMV7_EVENT_ATTR(exc_taken, ARMV7_PERFCTR_EXC_TAKEN);
562 ARMV7_EVENT_ATTR(exc_return, ARMV7_PERFCTR_EXC_EXECUTED);
563 ARMV7_EVENT_ATTR(cid_write_retired, ARMV7_PERFCTR_CID_WRITE);
564 ARMV7_EVENT_ATTR(pc_write_retired, ARMV7_PERFCTR_PC_WRITE);
565 ARMV7_EVENT_ATTR(br_immed_retired, ARMV7_PERFCTR_PC_IMM_BRANCH);
566 ARMV7_EVENT_ATTR(br_return_retired, ARMV7_PERFCTR_PC_PROC_RETURN);
567 ARMV7_EVENT_ATTR(unaligned_ldst_retired, ARMV7_PERFCTR_MEM_UNALIGNED_ACCESS);
568 ARMV7_EVENT_ATTR(br_mis_pred, ARMV7_PERFCTR_PC_BRANCH_MIS_PRED);
569 ARMV7_EVENT_ATTR(cpu_cycles, ARMV7_PERFCTR_CLOCK_CYCLES);
570 ARMV7_EVENT_ATTR(br_pred, ARMV7_PERFCTR_PC_BRANCH_PRED);
572 static struct attribute *armv7_pmuv1_event_attrs[] = {
573 &armv7_event_attr_sw_incr.attr.attr,
574 &armv7_event_attr_l1i_cache_refill.attr.attr,
575 &armv7_event_attr_l1i_tlb_refill.attr.attr,
576 &armv7_event_attr_l1d_cache_refill.attr.attr,
577 &armv7_event_attr_l1d_cache.attr.attr,
578 &armv7_event_attr_l1d_tlb_refill.attr.attr,
579 &armv7_event_attr_ld_retired.attr.attr,
580 &armv7_event_attr_st_retired.attr.attr,
581 &armv7_event_attr_inst_retired.attr.attr,
582 &armv7_event_attr_exc_taken.attr.attr,
583 &armv7_event_attr_exc_return.attr.attr,
584 &armv7_event_attr_cid_write_retired.attr.attr,
585 &armv7_event_attr_pc_write_retired.attr.attr,
586 &armv7_event_attr_br_immed_retired.attr.attr,
587 &armv7_event_attr_br_return_retired.attr.attr,
588 &armv7_event_attr_unaligned_ldst_retired.attr.attr,
589 &armv7_event_attr_br_mis_pred.attr.attr,
590 &armv7_event_attr_cpu_cycles.attr.attr,
591 &armv7_event_attr_br_pred.attr.attr,
595 static struct attribute_group armv7_pmuv1_events_attr_group = {
597 .attrs = armv7_pmuv1_event_attrs,
600 ARMV7_EVENT_ATTR(mem_access, ARMV7_PERFCTR_MEM_ACCESS);
601 ARMV7_EVENT_ATTR(l1i_cache, ARMV7_PERFCTR_L1_ICACHE_ACCESS);
602 ARMV7_EVENT_ATTR(l1d_cache_wb, ARMV7_PERFCTR_L1_DCACHE_WB);
603 ARMV7_EVENT_ATTR(l2d_cache, ARMV7_PERFCTR_L2_CACHE_ACCESS);
604 ARMV7_EVENT_ATTR(l2d_cache_refill, ARMV7_PERFCTR_L2_CACHE_REFILL);
605 ARMV7_EVENT_ATTR(l2d_cache_wb, ARMV7_PERFCTR_L2_CACHE_WB);
606 ARMV7_EVENT_ATTR(bus_access, ARMV7_PERFCTR_BUS_ACCESS);
607 ARMV7_EVENT_ATTR(memory_error, ARMV7_PERFCTR_MEM_ERROR);
608 ARMV7_EVENT_ATTR(inst_spec, ARMV7_PERFCTR_INSTR_SPEC);
609 ARMV7_EVENT_ATTR(ttbr_write_retired, ARMV7_PERFCTR_TTBR_WRITE);
610 ARMV7_EVENT_ATTR(bus_cycles, ARMV7_PERFCTR_BUS_CYCLES);
612 static struct attribute *armv7_pmuv2_event_attrs[] = {
613 &armv7_event_attr_sw_incr.attr.attr,
614 &armv7_event_attr_l1i_cache_refill.attr.attr,
615 &armv7_event_attr_l1i_tlb_refill.attr.attr,
616 &armv7_event_attr_l1d_cache_refill.attr.attr,
617 &armv7_event_attr_l1d_cache.attr.attr,
618 &armv7_event_attr_l1d_tlb_refill.attr.attr,
619 &armv7_event_attr_ld_retired.attr.attr,
620 &armv7_event_attr_st_retired.attr.attr,
621 &armv7_event_attr_inst_retired.attr.attr,
622 &armv7_event_attr_exc_taken.attr.attr,
623 &armv7_event_attr_exc_return.attr.attr,
624 &armv7_event_attr_cid_write_retired.attr.attr,
625 &armv7_event_attr_pc_write_retired.attr.attr,
626 &armv7_event_attr_br_immed_retired.attr.attr,
627 &armv7_event_attr_br_return_retired.attr.attr,
628 &armv7_event_attr_unaligned_ldst_retired.attr.attr,
629 &armv7_event_attr_br_mis_pred.attr.attr,
630 &armv7_event_attr_cpu_cycles.attr.attr,
631 &armv7_event_attr_br_pred.attr.attr,
632 &armv7_event_attr_mem_access.attr.attr,
633 &armv7_event_attr_l1i_cache.attr.attr,
634 &armv7_event_attr_l1d_cache_wb.attr.attr,
635 &armv7_event_attr_l2d_cache.attr.attr,
636 &armv7_event_attr_l2d_cache_refill.attr.attr,
637 &armv7_event_attr_l2d_cache_wb.attr.attr,
638 &armv7_event_attr_bus_access.attr.attr,
639 &armv7_event_attr_memory_error.attr.attr,
640 &armv7_event_attr_inst_spec.attr.attr,
641 &armv7_event_attr_ttbr_write_retired.attr.attr,
642 &armv7_event_attr_bus_cycles.attr.attr,
646 static struct attribute_group armv7_pmuv2_events_attr_group = {
648 .attrs = armv7_pmuv2_event_attrs,
652 * Perf Events' indices
654 #define ARMV7_IDX_CYCLE_COUNTER 0
655 #define ARMV7_IDX_COUNTER0 1
656 #define ARMV7_IDX_COUNTER_LAST(cpu_pmu) \
657 (ARMV7_IDX_CYCLE_COUNTER + cpu_pmu->num_events - 1)
659 #define ARMV7_MAX_COUNTERS 32
660 #define ARMV7_COUNTER_MASK (ARMV7_MAX_COUNTERS - 1)
663 * ARMv7 low level PMNC access
667 * Perf Event to low level counters mapping
669 #define ARMV7_IDX_TO_COUNTER(x) \
670 (((x) - ARMV7_IDX_COUNTER0) & ARMV7_COUNTER_MASK)
673 * Per-CPU PMNC: config reg
675 #define ARMV7_PMNC_E (1 << 0) /* Enable all counters */
676 #define ARMV7_PMNC_P (1 << 1) /* Reset all counters */
677 #define ARMV7_PMNC_C (1 << 2) /* Cycle counter reset */
678 #define ARMV7_PMNC_D (1 << 3) /* CCNT counts every 64th cpu cycle */
679 #define ARMV7_PMNC_X (1 << 4) /* Export to ETM */
680 #define ARMV7_PMNC_DP (1 << 5) /* Disable CCNT if non-invasive debug*/
681 #define ARMV7_PMNC_N_SHIFT 11 /* Number of counters supported */
682 #define ARMV7_PMNC_N_MASK 0x1f
683 #define ARMV7_PMNC_MASK 0x3f /* Mask for writable bits */
686 * FLAG: counters overflow flag status reg
688 #define ARMV7_FLAG_MASK 0xffffffff /* Mask for writable bits */
689 #define ARMV7_OVERFLOWED_MASK ARMV7_FLAG_MASK
692 * PMXEVTYPER: Event selection reg
694 #define ARMV7_EVTYPE_MASK 0xc80000ff /* Mask for writable bits */
695 #define ARMV7_EVTYPE_EVENT 0xff /* Mask for EVENT bits */
698 * Event filters for PMUv2
700 #define ARMV7_EXCLUDE_PL1 (1 << 31)
701 #define ARMV7_EXCLUDE_USER (1 << 30)
702 #define ARMV7_INCLUDE_HYP (1 << 27)
705 * Secure debug enable reg
707 #define ARMV7_SDER_SUNIDEN BIT(1) /* Permit non-invasive debug */
709 static inline u32 armv7_pmnc_read(void)
712 asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r"(val));
716 static inline void armv7_pmnc_write(u32 val)
718 val &= ARMV7_PMNC_MASK;
720 asm volatile("mcr p15, 0, %0, c9, c12, 0" : : "r"(val));
723 static inline int armv7_pmnc_has_overflowed(u32 pmnc)
725 return pmnc & ARMV7_OVERFLOWED_MASK;
728 static inline int armv7_pmnc_counter_valid(struct arm_pmu *cpu_pmu, int idx)
730 return idx >= ARMV7_IDX_CYCLE_COUNTER &&
731 idx <= ARMV7_IDX_COUNTER_LAST(cpu_pmu);
734 static inline int armv7_pmnc_counter_has_overflowed(u32 pmnc, int idx)
736 return pmnc & BIT(ARMV7_IDX_TO_COUNTER(idx));
739 static inline void armv7_pmnc_select_counter(int idx)
741 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
742 asm volatile("mcr p15, 0, %0, c9, c12, 5" : : "r" (counter));
746 static inline u64 armv7pmu_read_counter(struct perf_event *event)
748 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
749 struct hw_perf_event *hwc = &event->hw;
753 if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
754 pr_err("CPU%u reading wrong counter %d\n",
755 smp_processor_id(), idx);
756 } else if (idx == ARMV7_IDX_CYCLE_COUNTER) {
757 asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (value));
759 armv7_pmnc_select_counter(idx);
760 asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (value));
766 static inline void armv7pmu_write_counter(struct perf_event *event, u64 value)
768 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
769 struct hw_perf_event *hwc = &event->hw;
772 if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
773 pr_err("CPU%u writing wrong counter %d\n",
774 smp_processor_id(), idx);
775 } else if (idx == ARMV7_IDX_CYCLE_COUNTER) {
776 asm volatile("mcr p15, 0, %0, c9, c13, 0" : : "r" ((u32)value));
778 armv7_pmnc_select_counter(idx);
779 asm volatile("mcr p15, 0, %0, c9, c13, 2" : : "r" ((u32)value));
783 static inline void armv7_pmnc_write_evtsel(int idx, u32 val)
785 armv7_pmnc_select_counter(idx);
786 val &= ARMV7_EVTYPE_MASK;
787 asm volatile("mcr p15, 0, %0, c9, c13, 1" : : "r" (val));
790 static inline void armv7_pmnc_enable_counter(int idx)
792 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
793 asm volatile("mcr p15, 0, %0, c9, c12, 1" : : "r" (BIT(counter)));
796 static inline void armv7_pmnc_disable_counter(int idx)
798 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
799 asm volatile("mcr p15, 0, %0, c9, c12, 2" : : "r" (BIT(counter)));
802 static inline void armv7_pmnc_enable_intens(int idx)
804 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
805 asm volatile("mcr p15, 0, %0, c9, c14, 1" : : "r" (BIT(counter)));
808 static inline void armv7_pmnc_disable_intens(int idx)
810 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
811 asm volatile("mcr p15, 0, %0, c9, c14, 2" : : "r" (BIT(counter)));
813 /* Clear the overflow flag in case an interrupt is pending. */
814 asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (BIT(counter)));
818 static inline u32 armv7_pmnc_getreset_flags(void)
823 asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
825 /* Write to clear flags */
826 val &= ARMV7_FLAG_MASK;
827 asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (val));
833 static void armv7_pmnc_dump_regs(struct arm_pmu *cpu_pmu)
838 pr_info("PMNC registers dump:\n");
840 asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r" (val));
841 pr_info("PMNC =0x%08x\n", val);
843 asm volatile("mrc p15, 0, %0, c9, c12, 1" : "=r" (val));
844 pr_info("CNTENS=0x%08x\n", val);
846 asm volatile("mrc p15, 0, %0, c9, c14, 1" : "=r" (val));
847 pr_info("INTENS=0x%08x\n", val);
849 asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
850 pr_info("FLAGS =0x%08x\n", val);
852 asm volatile("mrc p15, 0, %0, c9, c12, 5" : "=r" (val));
853 pr_info("SELECT=0x%08x\n", val);
855 asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (val));
856 pr_info("CCNT =0x%08x\n", val);
858 for (cnt = ARMV7_IDX_COUNTER0;
859 cnt <= ARMV7_IDX_COUNTER_LAST(cpu_pmu); cnt++) {
860 armv7_pmnc_select_counter(cnt);
861 asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (val));
862 pr_info("CNT[%d] count =0x%08x\n",
863 ARMV7_IDX_TO_COUNTER(cnt), val);
864 asm volatile("mrc p15, 0, %0, c9, c13, 1" : "=r" (val));
865 pr_info("CNT[%d] evtsel=0x%08x\n",
866 ARMV7_IDX_TO_COUNTER(cnt), val);
871 static void armv7pmu_enable_event(struct perf_event *event)
874 struct hw_perf_event *hwc = &event->hw;
875 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
876 struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
879 if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
880 pr_err("CPU%u enabling wrong PMNC counter IRQ enable %d\n",
881 smp_processor_id(), idx);
886 * Enable counter and interrupt, and set the counter to count
887 * the event that we're interested in.
889 raw_spin_lock_irqsave(&events->pmu_lock, flags);
894 armv7_pmnc_disable_counter(idx);
897 * Set event (if destined for PMNx counters)
898 * We only need to set the event for the cycle counter if we
899 * have the ability to perform event filtering.
901 if (cpu_pmu->set_event_filter || idx != ARMV7_IDX_CYCLE_COUNTER)
902 armv7_pmnc_write_evtsel(idx, hwc->config_base);
905 * Enable interrupt for this counter
907 armv7_pmnc_enable_intens(idx);
912 armv7_pmnc_enable_counter(idx);
914 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
917 static void armv7pmu_disable_event(struct perf_event *event)
920 struct hw_perf_event *hwc = &event->hw;
921 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
922 struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
925 if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
926 pr_err("CPU%u disabling wrong PMNC counter IRQ enable %d\n",
927 smp_processor_id(), idx);
932 * Disable counter and interrupt
934 raw_spin_lock_irqsave(&events->pmu_lock, flags);
939 armv7_pmnc_disable_counter(idx);
942 * Disable interrupt for this counter
944 armv7_pmnc_disable_intens(idx);
946 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
949 static irqreturn_t armv7pmu_handle_irq(struct arm_pmu *cpu_pmu)
952 struct perf_sample_data data;
953 struct pmu_hw_events *cpuc = this_cpu_ptr(cpu_pmu->hw_events);
954 struct pt_regs *regs;
958 * Get and reset the IRQ flags
960 pmnc = armv7_pmnc_getreset_flags();
963 * Did an overflow occur?
965 if (!armv7_pmnc_has_overflowed(pmnc))
969 * Handle the counter(s) overflow(s)
971 regs = get_irq_regs();
973 for (idx = 0; idx < cpu_pmu->num_events; ++idx) {
974 struct perf_event *event = cpuc->events[idx];
975 struct hw_perf_event *hwc;
977 /* Ignore if we don't have an event. */
982 * We have a single interrupt for all counters. Check that
983 * each counter has overflowed before we process it.
985 if (!armv7_pmnc_counter_has_overflowed(pmnc, idx))
989 armpmu_event_update(event);
990 perf_sample_data_init(&data, 0, hwc->last_period);
991 if (!armpmu_event_set_period(event))
994 if (perf_event_overflow(event, &data, regs))
995 cpu_pmu->disable(event);
999 * Handle the pending perf events.
1001 * Note: this call *must* be run with interrupts disabled. For
1002 * platforms that can have the PMU interrupts raised as an NMI, this
1010 static void armv7pmu_start(struct arm_pmu *cpu_pmu)
1012 unsigned long flags;
1013 struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1015 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1016 /* Enable all counters */
1017 armv7_pmnc_write(armv7_pmnc_read() | ARMV7_PMNC_E);
1018 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1021 static void armv7pmu_stop(struct arm_pmu *cpu_pmu)
1023 unsigned long flags;
1024 struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1026 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1027 /* Disable all counters */
1028 armv7_pmnc_write(armv7_pmnc_read() & ~ARMV7_PMNC_E);
1029 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1032 static int armv7pmu_get_event_idx(struct pmu_hw_events *cpuc,
1033 struct perf_event *event)
1036 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1037 struct hw_perf_event *hwc = &event->hw;
1038 unsigned long evtype = hwc->config_base & ARMV7_EVTYPE_EVENT;
1040 /* Always place a cycle counter into the cycle counter. */
1041 if (evtype == ARMV7_PERFCTR_CPU_CYCLES) {
1042 if (test_and_set_bit(ARMV7_IDX_CYCLE_COUNTER, cpuc->used_mask))
1045 return ARMV7_IDX_CYCLE_COUNTER;
1049 * For anything other than a cycle counter, try and use
1050 * the events counters
1052 for (idx = ARMV7_IDX_COUNTER0; idx < cpu_pmu->num_events; ++idx) {
1053 if (!test_and_set_bit(idx, cpuc->used_mask))
1057 /* The counters are all in use. */
1061 static void armv7pmu_clear_event_idx(struct pmu_hw_events *cpuc,
1062 struct perf_event *event)
1064 clear_bit(event->hw.idx, cpuc->used_mask);
1068 * Add an event filter to a given event. This will only work for PMUv2 PMUs.
1070 static int armv7pmu_set_event_filter(struct hw_perf_event *event,
1071 struct perf_event_attr *attr)
1073 unsigned long config_base = 0;
1075 if (attr->exclude_idle)
1077 if (attr->exclude_user)
1078 config_base |= ARMV7_EXCLUDE_USER;
1079 if (attr->exclude_kernel)
1080 config_base |= ARMV7_EXCLUDE_PL1;
1081 if (!attr->exclude_hv)
1082 config_base |= ARMV7_INCLUDE_HYP;
1085 * Install the filter into config_base as this is used to
1086 * construct the event type.
1088 event->config_base = config_base;
1093 static void armv7pmu_reset(void *info)
1095 struct arm_pmu *cpu_pmu = (struct arm_pmu *)info;
1096 u32 idx, nb_cnt = cpu_pmu->num_events, val;
1098 if (cpu_pmu->secure_access) {
1099 asm volatile("mrc p15, 0, %0, c1, c1, 1" : "=r" (val));
1100 val |= ARMV7_SDER_SUNIDEN;
1101 asm volatile("mcr p15, 0, %0, c1, c1, 1" : : "r" (val));
1104 /* The counter and interrupt enable registers are unknown at reset. */
1105 for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1106 armv7_pmnc_disable_counter(idx);
1107 armv7_pmnc_disable_intens(idx);
1110 /* Initialize & Reset PMNC: C and P bits */
1111 armv7_pmnc_write(ARMV7_PMNC_P | ARMV7_PMNC_C);
1114 static int armv7_a8_map_event(struct perf_event *event)
1116 return armpmu_map_event(event, &armv7_a8_perf_map,
1117 &armv7_a8_perf_cache_map, 0xFF);
1120 static int armv7_a9_map_event(struct perf_event *event)
1122 return armpmu_map_event(event, &armv7_a9_perf_map,
1123 &armv7_a9_perf_cache_map, 0xFF);
1126 static int armv7_a5_map_event(struct perf_event *event)
1128 return armpmu_map_event(event, &armv7_a5_perf_map,
1129 &armv7_a5_perf_cache_map, 0xFF);
1132 static int armv7_a15_map_event(struct perf_event *event)
1134 return armpmu_map_event(event, &armv7_a15_perf_map,
1135 &armv7_a15_perf_cache_map, 0xFF);
1138 static int armv7_a7_map_event(struct perf_event *event)
1140 return armpmu_map_event(event, &armv7_a7_perf_map,
1141 &armv7_a7_perf_cache_map, 0xFF);
1144 static int armv7_a12_map_event(struct perf_event *event)
1146 return armpmu_map_event(event, &armv7_a12_perf_map,
1147 &armv7_a12_perf_cache_map, 0xFF);
1150 static int krait_map_event(struct perf_event *event)
1152 return armpmu_map_event(event, &krait_perf_map,
1153 &krait_perf_cache_map, 0xFFFFF);
1156 static int krait_map_event_no_branch(struct perf_event *event)
1158 return armpmu_map_event(event, &krait_perf_map_no_branch,
1159 &krait_perf_cache_map, 0xFFFFF);
1162 static int scorpion_map_event(struct perf_event *event)
1164 return armpmu_map_event(event, &scorpion_perf_map,
1165 &scorpion_perf_cache_map, 0xFFFFF);
1168 static void armv7pmu_init(struct arm_pmu *cpu_pmu)
1170 cpu_pmu->handle_irq = armv7pmu_handle_irq;
1171 cpu_pmu->enable = armv7pmu_enable_event;
1172 cpu_pmu->disable = armv7pmu_disable_event;
1173 cpu_pmu->read_counter = armv7pmu_read_counter;
1174 cpu_pmu->write_counter = armv7pmu_write_counter;
1175 cpu_pmu->get_event_idx = armv7pmu_get_event_idx;
1176 cpu_pmu->clear_event_idx = armv7pmu_clear_event_idx;
1177 cpu_pmu->start = armv7pmu_start;
1178 cpu_pmu->stop = armv7pmu_stop;
1179 cpu_pmu->reset = armv7pmu_reset;
1182 static void armv7_read_num_pmnc_events(void *info)
1186 /* Read the nb of CNTx counters supported from PMNC */
1187 *nb_cnt = (armv7_pmnc_read() >> ARMV7_PMNC_N_SHIFT) & ARMV7_PMNC_N_MASK;
1189 /* Add the CPU cycles counter */
1193 static int armv7_probe_num_events(struct arm_pmu *arm_pmu)
1195 return smp_call_function_any(&arm_pmu->supported_cpus,
1196 armv7_read_num_pmnc_events,
1197 &arm_pmu->num_events, 1);
1200 static int armv7_a8_pmu_init(struct arm_pmu *cpu_pmu)
1202 armv7pmu_init(cpu_pmu);
1203 cpu_pmu->name = "armv7_cortex_a8";
1204 cpu_pmu->map_event = armv7_a8_map_event;
1205 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1206 &armv7_pmuv1_events_attr_group;
1207 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1208 &armv7_pmu_format_attr_group;
1209 return armv7_probe_num_events(cpu_pmu);
1212 static int armv7_a9_pmu_init(struct arm_pmu *cpu_pmu)
1214 armv7pmu_init(cpu_pmu);
1215 cpu_pmu->name = "armv7_cortex_a9";
1216 cpu_pmu->map_event = armv7_a9_map_event;
1217 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1218 &armv7_pmuv1_events_attr_group;
1219 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1220 &armv7_pmu_format_attr_group;
1221 return armv7_probe_num_events(cpu_pmu);
1224 static int armv7_a5_pmu_init(struct arm_pmu *cpu_pmu)
1226 armv7pmu_init(cpu_pmu);
1227 cpu_pmu->name = "armv7_cortex_a5";
1228 cpu_pmu->map_event = armv7_a5_map_event;
1229 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1230 &armv7_pmuv1_events_attr_group;
1231 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1232 &armv7_pmu_format_attr_group;
1233 return armv7_probe_num_events(cpu_pmu);
1236 static int armv7_a15_pmu_init(struct arm_pmu *cpu_pmu)
1238 armv7pmu_init(cpu_pmu);
1239 cpu_pmu->name = "armv7_cortex_a15";
1240 cpu_pmu->map_event = armv7_a15_map_event;
1241 cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1242 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1243 &armv7_pmuv2_events_attr_group;
1244 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1245 &armv7_pmu_format_attr_group;
1246 return armv7_probe_num_events(cpu_pmu);
1249 static int armv7_a7_pmu_init(struct arm_pmu *cpu_pmu)
1251 armv7pmu_init(cpu_pmu);
1252 cpu_pmu->name = "armv7_cortex_a7";
1253 cpu_pmu->map_event = armv7_a7_map_event;
1254 cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1255 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1256 &armv7_pmuv2_events_attr_group;
1257 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1258 &armv7_pmu_format_attr_group;
1259 return armv7_probe_num_events(cpu_pmu);
1262 static int armv7_a12_pmu_init(struct arm_pmu *cpu_pmu)
1264 armv7pmu_init(cpu_pmu);
1265 cpu_pmu->name = "armv7_cortex_a12";
1266 cpu_pmu->map_event = armv7_a12_map_event;
1267 cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1268 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1269 &armv7_pmuv2_events_attr_group;
1270 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1271 &armv7_pmu_format_attr_group;
1272 return armv7_probe_num_events(cpu_pmu);
1275 static int armv7_a17_pmu_init(struct arm_pmu *cpu_pmu)
1277 int ret = armv7_a12_pmu_init(cpu_pmu);
1278 cpu_pmu->name = "armv7_cortex_a17";
1279 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1280 &armv7_pmuv2_events_attr_group;
1281 cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1282 &armv7_pmu_format_attr_group;
1287 * Krait Performance Monitor Region Event Selection Register (PMRESRn)
1290 * +--------------------------------+
1291 * PMRESR0 | EN | CC | CC | CC | CC | N = 1, R = 0
1292 * +--------------------------------+
1293 * PMRESR1 | EN | CC | CC | CC | CC | N = 1, R = 1
1294 * +--------------------------------+
1295 * PMRESR2 | EN | CC | CC | CC | CC | N = 1, R = 2
1296 * +--------------------------------+
1297 * VPMRESR0 | EN | CC | CC | CC | CC | N = 2, R = ?
1298 * +--------------------------------+
1299 * EN | G=3 | G=2 | G=1 | G=0
1303 * hwc->config_base = 0xNRCCG
1305 * N = prefix, 1 for Krait CPU (PMRESRn), 2 for Venum VFP (VPMRESR)
1306 * R = region register
1307 * CC = class of events the group G is choosing from
1308 * G = group or particular event
1310 * Example: 0x12021 is a Krait CPU event in PMRESR2's group 1 with code 2
1312 * A region (R) corresponds to a piece of the CPU (execution unit, instruction
1313 * unit, etc.) while the event code (CC) corresponds to a particular class of
1314 * events (interrupts for example). An event code is broken down into
1315 * groups (G) that can be mapped into the PMU (irq, fiqs, and irq+fiqs for
1319 #define KRAIT_EVENT (1 << 16)
1320 #define VENUM_EVENT (2 << 16)
1321 #define KRAIT_EVENT_MASK (KRAIT_EVENT | VENUM_EVENT)
1322 #define PMRESRn_EN BIT(31)
1324 #define EVENT_REGION(event) (((event) >> 12) & 0xf) /* R */
1325 #define EVENT_GROUP(event) ((event) & 0xf) /* G */
1326 #define EVENT_CODE(event) (((event) >> 4) & 0xff) /* CC */
1327 #define EVENT_VENUM(event) (!!(event & VENUM_EVENT)) /* N=2 */
1328 #define EVENT_CPU(event) (!!(event & KRAIT_EVENT)) /* N=1 */
1330 static u32 krait_read_pmresrn(int n)
1336 asm volatile("mrc p15, 1, %0, c9, c15, 0" : "=r" (val));
1339 asm volatile("mrc p15, 1, %0, c9, c15, 1" : "=r" (val));
1342 asm volatile("mrc p15, 1, %0, c9, c15, 2" : "=r" (val));
1345 BUG(); /* Should be validated in krait_pmu_get_event_idx() */
1351 static void krait_write_pmresrn(int n, u32 val)
1355 asm volatile("mcr p15, 1, %0, c9, c15, 0" : : "r" (val));
1358 asm volatile("mcr p15, 1, %0, c9, c15, 1" : : "r" (val));
1361 asm volatile("mcr p15, 1, %0, c9, c15, 2" : : "r" (val));
1364 BUG(); /* Should be validated in krait_pmu_get_event_idx() */
1368 static u32 venum_read_pmresr(void)
1371 asm volatile("mrc p10, 7, %0, c11, c0, 0" : "=r" (val));
1375 static void venum_write_pmresr(u32 val)
1377 asm volatile("mcr p10, 7, %0, c11, c0, 0" : : "r" (val));
1380 static void venum_pre_pmresr(u32 *venum_orig_val, u32 *fp_orig_val)
1385 BUG_ON(preemptible());
1386 /* CPACR Enable CP10 and CP11 access */
1387 *venum_orig_val = get_copro_access();
1388 venum_new_val = *venum_orig_val | CPACC_SVC(10) | CPACC_SVC(11);
1389 set_copro_access(venum_new_val);
1392 *fp_orig_val = fmrx(FPEXC);
1393 fp_new_val = *fp_orig_val | FPEXC_EN;
1394 fmxr(FPEXC, fp_new_val);
1397 static void venum_post_pmresr(u32 venum_orig_val, u32 fp_orig_val)
1399 BUG_ON(preemptible());
1401 fmxr(FPEXC, fp_orig_val);
1404 set_copro_access(venum_orig_val);
1407 static u32 krait_get_pmresrn_event(unsigned int region)
1409 static const u32 pmresrn_table[] = { KRAIT_PMRESR0_GROUP0,
1410 KRAIT_PMRESR1_GROUP0,
1411 KRAIT_PMRESR2_GROUP0 };
1412 return pmresrn_table[region];
1415 static void krait_evt_setup(int idx, u32 config_base)
1420 unsigned int region = EVENT_REGION(config_base);
1421 unsigned int group = EVENT_GROUP(config_base);
1422 unsigned int code = EVENT_CODE(config_base);
1423 unsigned int group_shift;
1424 bool venum_event = EVENT_VENUM(config_base);
1426 group_shift = group * 8;
1427 mask = 0xff << group_shift;
1429 /* Configure evtsel for the region and group */
1431 val = KRAIT_VPMRESR0_GROUP0;
1433 val = krait_get_pmresrn_event(region);
1435 /* Mix in mode-exclusion bits */
1436 val |= config_base & (ARMV7_EXCLUDE_USER | ARMV7_EXCLUDE_PL1);
1437 armv7_pmnc_write_evtsel(idx, val);
1440 venum_pre_pmresr(&vval, &fval);
1441 val = venum_read_pmresr();
1443 val |= code << group_shift;
1445 venum_write_pmresr(val);
1446 venum_post_pmresr(vval, fval);
1448 val = krait_read_pmresrn(region);
1450 val |= code << group_shift;
1452 krait_write_pmresrn(region, val);
1456 static u32 clear_pmresrn_group(u32 val, int group)
1461 group_shift = group * 8;
1462 mask = 0xff << group_shift;
1465 /* Don't clear enable bit if entire region isn't disabled */
1466 if (val & ~PMRESRn_EN)
1467 return val |= PMRESRn_EN;
1472 static void krait_clearpmu(u32 config_base)
1476 unsigned int region = EVENT_REGION(config_base);
1477 unsigned int group = EVENT_GROUP(config_base);
1478 bool venum_event = EVENT_VENUM(config_base);
1481 venum_pre_pmresr(&vval, &fval);
1482 val = venum_read_pmresr();
1483 val = clear_pmresrn_group(val, group);
1484 venum_write_pmresr(val);
1485 venum_post_pmresr(vval, fval);
1487 val = krait_read_pmresrn(region);
1488 val = clear_pmresrn_group(val, group);
1489 krait_write_pmresrn(region, val);
1493 static void krait_pmu_disable_event(struct perf_event *event)
1495 unsigned long flags;
1496 struct hw_perf_event *hwc = &event->hw;
1498 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1499 struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1501 /* Disable counter and interrupt */
1502 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1504 /* Disable counter */
1505 armv7_pmnc_disable_counter(idx);
1508 * Clear pmresr code (if destined for PMNx counters)
1510 if (hwc->config_base & KRAIT_EVENT_MASK)
1511 krait_clearpmu(hwc->config_base);
1513 /* Disable interrupt for this counter */
1514 armv7_pmnc_disable_intens(idx);
1516 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1519 static void krait_pmu_enable_event(struct perf_event *event)
1521 unsigned long flags;
1522 struct hw_perf_event *hwc = &event->hw;
1524 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1525 struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1528 * Enable counter and interrupt, and set the counter to count
1529 * the event that we're interested in.
1531 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1533 /* Disable counter */
1534 armv7_pmnc_disable_counter(idx);
1537 * Set event (if destined for PMNx counters)
1538 * We set the event for the cycle counter because we
1539 * have the ability to perform event filtering.
1541 if (hwc->config_base & KRAIT_EVENT_MASK)
1542 krait_evt_setup(idx, hwc->config_base);
1544 armv7_pmnc_write_evtsel(idx, hwc->config_base);
1546 /* Enable interrupt for this counter */
1547 armv7_pmnc_enable_intens(idx);
1549 /* Enable counter */
1550 armv7_pmnc_enable_counter(idx);
1552 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1555 static void krait_pmu_reset(void *info)
1558 struct arm_pmu *cpu_pmu = info;
1559 u32 idx, nb_cnt = cpu_pmu->num_events;
1561 armv7pmu_reset(info);
1563 /* Clear all pmresrs */
1564 krait_write_pmresrn(0, 0);
1565 krait_write_pmresrn(1, 0);
1566 krait_write_pmresrn(2, 0);
1568 venum_pre_pmresr(&vval, &fval);
1569 venum_write_pmresr(0);
1570 venum_post_pmresr(vval, fval);
1572 /* Reset PMxEVNCTCR to sane default */
1573 for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1574 armv7_pmnc_select_counter(idx);
1575 asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1580 static int krait_event_to_bit(struct perf_event *event, unsigned int region,
1584 struct hw_perf_event *hwc = &event->hw;
1585 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1587 if (hwc->config_base & VENUM_EVENT)
1588 bit = KRAIT_VPMRESR0_GROUP0;
1590 bit = krait_get_pmresrn_event(region);
1591 bit -= krait_get_pmresrn_event(0);
1594 * Lower bits are reserved for use by the counters (see
1595 * armv7pmu_get_event_idx() for more info)
1597 bit += ARMV7_IDX_COUNTER_LAST(cpu_pmu) + 1;
1603 * We check for column exclusion constraints here.
1604 * Two events cant use the same group within a pmresr register.
1606 static int krait_pmu_get_event_idx(struct pmu_hw_events *cpuc,
1607 struct perf_event *event)
1611 struct hw_perf_event *hwc = &event->hw;
1612 unsigned int region = EVENT_REGION(hwc->config_base);
1613 unsigned int code = EVENT_CODE(hwc->config_base);
1614 unsigned int group = EVENT_GROUP(hwc->config_base);
1615 bool venum_event = EVENT_VENUM(hwc->config_base);
1616 bool krait_event = EVENT_CPU(hwc->config_base);
1618 if (venum_event || krait_event) {
1619 /* Ignore invalid events */
1620 if (group > 3 || region > 2)
1622 if (venum_event && (code & 0xe0))
1625 bit = krait_event_to_bit(event, region, group);
1626 if (test_and_set_bit(bit, cpuc->used_mask))
1630 idx = armv7pmu_get_event_idx(cpuc, event);
1631 if (idx < 0 && bit >= 0)
1632 clear_bit(bit, cpuc->used_mask);
1637 static void krait_pmu_clear_event_idx(struct pmu_hw_events *cpuc,
1638 struct perf_event *event)
1641 struct hw_perf_event *hwc = &event->hw;
1642 unsigned int region = EVENT_REGION(hwc->config_base);
1643 unsigned int group = EVENT_GROUP(hwc->config_base);
1644 bool venum_event = EVENT_VENUM(hwc->config_base);
1645 bool krait_event = EVENT_CPU(hwc->config_base);
1647 armv7pmu_clear_event_idx(cpuc, event);
1648 if (venum_event || krait_event) {
1649 bit = krait_event_to_bit(event, region, group);
1650 clear_bit(bit, cpuc->used_mask);
1654 static int krait_pmu_init(struct arm_pmu *cpu_pmu)
1656 armv7pmu_init(cpu_pmu);
1657 cpu_pmu->name = "armv7_krait";
1658 /* Some early versions of Krait don't support PC write events */
1659 if (of_property_read_bool(cpu_pmu->plat_device->dev.of_node,
1660 "qcom,no-pc-write"))
1661 cpu_pmu->map_event = krait_map_event_no_branch;
1663 cpu_pmu->map_event = krait_map_event;
1664 cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1665 cpu_pmu->reset = krait_pmu_reset;
1666 cpu_pmu->enable = krait_pmu_enable_event;
1667 cpu_pmu->disable = krait_pmu_disable_event;
1668 cpu_pmu->get_event_idx = krait_pmu_get_event_idx;
1669 cpu_pmu->clear_event_idx = krait_pmu_clear_event_idx;
1670 return armv7_probe_num_events(cpu_pmu);
1674 * Scorpion Local Performance Monitor Register (LPMn)
1677 * +--------------------------------+
1678 * LPM0 | EN | CC | CC | CC | CC | N = 1, R = 0
1679 * +--------------------------------+
1680 * LPM1 | EN | CC | CC | CC | CC | N = 1, R = 1
1681 * +--------------------------------+
1682 * LPM2 | EN | CC | CC | CC | CC | N = 1, R = 2
1683 * +--------------------------------+
1684 * L2LPM | EN | CC | CC | CC | CC | N = 1, R = 3
1685 * +--------------------------------+
1686 * VLPM | EN | CC | CC | CC | CC | N = 2, R = ?
1687 * +--------------------------------+
1688 * EN | G=3 | G=2 | G=1 | G=0
1693 * hwc->config_base = 0xNRCCG
1695 * N = prefix, 1 for Scorpion CPU (LPMn/L2LPM), 2 for Venum VFP (VLPM)
1696 * R = region register
1697 * CC = class of events the group G is choosing from
1698 * G = group or particular event
1700 * Example: 0x12021 is a Scorpion CPU event in LPM2's group 1 with code 2
1702 * A region (R) corresponds to a piece of the CPU (execution unit, instruction
1703 * unit, etc.) while the event code (CC) corresponds to a particular class of
1704 * events (interrupts for example). An event code is broken down into
1705 * groups (G) that can be mapped into the PMU (irq, fiqs, and irq+fiqs for
1709 static u32 scorpion_read_pmresrn(int n)
1715 asm volatile("mrc p15, 0, %0, c15, c0, 0" : "=r" (val));
1718 asm volatile("mrc p15, 1, %0, c15, c0, 0" : "=r" (val));
1721 asm volatile("mrc p15, 2, %0, c15, c0, 0" : "=r" (val));
1724 asm volatile("mrc p15, 3, %0, c15, c2, 0" : "=r" (val));
1727 BUG(); /* Should be validated in scorpion_pmu_get_event_idx() */
1733 static void scorpion_write_pmresrn(int n, u32 val)
1737 asm volatile("mcr p15, 0, %0, c15, c0, 0" : : "r" (val));
1740 asm volatile("mcr p15, 1, %0, c15, c0, 0" : : "r" (val));
1743 asm volatile("mcr p15, 2, %0, c15, c0, 0" : : "r" (val));
1746 asm volatile("mcr p15, 3, %0, c15, c2, 0" : : "r" (val));
1749 BUG(); /* Should be validated in scorpion_pmu_get_event_idx() */
1753 static u32 scorpion_get_pmresrn_event(unsigned int region)
1755 static const u32 pmresrn_table[] = { SCORPION_LPM0_GROUP0,
1756 SCORPION_LPM1_GROUP0,
1757 SCORPION_LPM2_GROUP0,
1758 SCORPION_L2LPM_GROUP0 };
1759 return pmresrn_table[region];
1762 static void scorpion_evt_setup(int idx, u32 config_base)
1767 unsigned int region = EVENT_REGION(config_base);
1768 unsigned int group = EVENT_GROUP(config_base);
1769 unsigned int code = EVENT_CODE(config_base);
1770 unsigned int group_shift;
1771 bool venum_event = EVENT_VENUM(config_base);
1773 group_shift = group * 8;
1774 mask = 0xff << group_shift;
1776 /* Configure evtsel for the region and group */
1778 val = SCORPION_VLPM_GROUP0;
1780 val = scorpion_get_pmresrn_event(region);
1782 /* Mix in mode-exclusion bits */
1783 val |= config_base & (ARMV7_EXCLUDE_USER | ARMV7_EXCLUDE_PL1);
1784 armv7_pmnc_write_evtsel(idx, val);
1786 asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1789 venum_pre_pmresr(&vval, &fval);
1790 val = venum_read_pmresr();
1792 val |= code << group_shift;
1794 venum_write_pmresr(val);
1795 venum_post_pmresr(vval, fval);
1797 val = scorpion_read_pmresrn(region);
1799 val |= code << group_shift;
1801 scorpion_write_pmresrn(region, val);
1805 static void scorpion_clearpmu(u32 config_base)
1809 unsigned int region = EVENT_REGION(config_base);
1810 unsigned int group = EVENT_GROUP(config_base);
1811 bool venum_event = EVENT_VENUM(config_base);
1814 venum_pre_pmresr(&vval, &fval);
1815 val = venum_read_pmresr();
1816 val = clear_pmresrn_group(val, group);
1817 venum_write_pmresr(val);
1818 venum_post_pmresr(vval, fval);
1820 val = scorpion_read_pmresrn(region);
1821 val = clear_pmresrn_group(val, group);
1822 scorpion_write_pmresrn(region, val);
1826 static void scorpion_pmu_disable_event(struct perf_event *event)
1828 unsigned long flags;
1829 struct hw_perf_event *hwc = &event->hw;
1831 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1832 struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1834 /* Disable counter and interrupt */
1835 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1837 /* Disable counter */
1838 armv7_pmnc_disable_counter(idx);
1841 * Clear pmresr code (if destined for PMNx counters)
1843 if (hwc->config_base & KRAIT_EVENT_MASK)
1844 scorpion_clearpmu(hwc->config_base);
1846 /* Disable interrupt for this counter */
1847 armv7_pmnc_disable_intens(idx);
1849 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1852 static void scorpion_pmu_enable_event(struct perf_event *event)
1854 unsigned long flags;
1855 struct hw_perf_event *hwc = &event->hw;
1857 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1858 struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1861 * Enable counter and interrupt, and set the counter to count
1862 * the event that we're interested in.
1864 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1866 /* Disable counter */
1867 armv7_pmnc_disable_counter(idx);
1870 * Set event (if destined for PMNx counters)
1871 * We don't set the event for the cycle counter because we
1872 * don't have the ability to perform event filtering.
1874 if (hwc->config_base & KRAIT_EVENT_MASK)
1875 scorpion_evt_setup(idx, hwc->config_base);
1876 else if (idx != ARMV7_IDX_CYCLE_COUNTER)
1877 armv7_pmnc_write_evtsel(idx, hwc->config_base);
1879 /* Enable interrupt for this counter */
1880 armv7_pmnc_enable_intens(idx);
1882 /* Enable counter */
1883 armv7_pmnc_enable_counter(idx);
1885 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1888 static void scorpion_pmu_reset(void *info)
1891 struct arm_pmu *cpu_pmu = info;
1892 u32 idx, nb_cnt = cpu_pmu->num_events;
1894 armv7pmu_reset(info);
1896 /* Clear all pmresrs */
1897 scorpion_write_pmresrn(0, 0);
1898 scorpion_write_pmresrn(1, 0);
1899 scorpion_write_pmresrn(2, 0);
1900 scorpion_write_pmresrn(3, 0);
1902 venum_pre_pmresr(&vval, &fval);
1903 venum_write_pmresr(0);
1904 venum_post_pmresr(vval, fval);
1906 /* Reset PMxEVNCTCR to sane default */
1907 for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1908 armv7_pmnc_select_counter(idx);
1909 asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1913 static int scorpion_event_to_bit(struct perf_event *event, unsigned int region,
1917 struct hw_perf_event *hwc = &event->hw;
1918 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1920 if (hwc->config_base & VENUM_EVENT)
1921 bit = SCORPION_VLPM_GROUP0;
1923 bit = scorpion_get_pmresrn_event(region);
1924 bit -= scorpion_get_pmresrn_event(0);
1927 * Lower bits are reserved for use by the counters (see
1928 * armv7pmu_get_event_idx() for more info)
1930 bit += ARMV7_IDX_COUNTER_LAST(cpu_pmu) + 1;
1936 * We check for column exclusion constraints here.
1937 * Two events cant use the same group within a pmresr register.
1939 static int scorpion_pmu_get_event_idx(struct pmu_hw_events *cpuc,
1940 struct perf_event *event)
1944 struct hw_perf_event *hwc = &event->hw;
1945 unsigned int region = EVENT_REGION(hwc->config_base);
1946 unsigned int group = EVENT_GROUP(hwc->config_base);
1947 bool venum_event = EVENT_VENUM(hwc->config_base);
1948 bool scorpion_event = EVENT_CPU(hwc->config_base);
1950 if (venum_event || scorpion_event) {
1951 /* Ignore invalid events */
1952 if (group > 3 || region > 3)
1955 bit = scorpion_event_to_bit(event, region, group);
1956 if (test_and_set_bit(bit, cpuc->used_mask))
1960 idx = armv7pmu_get_event_idx(cpuc, event);
1961 if (idx < 0 && bit >= 0)
1962 clear_bit(bit, cpuc->used_mask);
1967 static void scorpion_pmu_clear_event_idx(struct pmu_hw_events *cpuc,
1968 struct perf_event *event)
1971 struct hw_perf_event *hwc = &event->hw;
1972 unsigned int region = EVENT_REGION(hwc->config_base);
1973 unsigned int group = EVENT_GROUP(hwc->config_base);
1974 bool venum_event = EVENT_VENUM(hwc->config_base);
1975 bool scorpion_event = EVENT_CPU(hwc->config_base);
1977 armv7pmu_clear_event_idx(cpuc, event);
1978 if (venum_event || scorpion_event) {
1979 bit = scorpion_event_to_bit(event, region, group);
1980 clear_bit(bit, cpuc->used_mask);
1984 static int scorpion_pmu_init(struct arm_pmu *cpu_pmu)
1986 armv7pmu_init(cpu_pmu);
1987 cpu_pmu->name = "armv7_scorpion";
1988 cpu_pmu->map_event = scorpion_map_event;
1989 cpu_pmu->reset = scorpion_pmu_reset;
1990 cpu_pmu->enable = scorpion_pmu_enable_event;
1991 cpu_pmu->disable = scorpion_pmu_disable_event;
1992 cpu_pmu->get_event_idx = scorpion_pmu_get_event_idx;
1993 cpu_pmu->clear_event_idx = scorpion_pmu_clear_event_idx;
1994 return armv7_probe_num_events(cpu_pmu);
1997 static int scorpion_mp_pmu_init(struct arm_pmu *cpu_pmu)
1999 armv7pmu_init(cpu_pmu);
2000 cpu_pmu->name = "armv7_scorpion_mp";
2001 cpu_pmu->map_event = scorpion_map_event;
2002 cpu_pmu->reset = scorpion_pmu_reset;
2003 cpu_pmu->enable = scorpion_pmu_enable_event;
2004 cpu_pmu->disable = scorpion_pmu_disable_event;
2005 cpu_pmu->get_event_idx = scorpion_pmu_get_event_idx;
2006 cpu_pmu->clear_event_idx = scorpion_pmu_clear_event_idx;
2007 return armv7_probe_num_events(cpu_pmu);
2010 static const struct of_device_id armv7_pmu_of_device_ids[] = {
2011 {.compatible = "arm,cortex-a17-pmu", .data = armv7_a17_pmu_init},
2012 {.compatible = "arm,cortex-a15-pmu", .data = armv7_a15_pmu_init},
2013 {.compatible = "arm,cortex-a12-pmu", .data = armv7_a12_pmu_init},
2014 {.compatible = "arm,cortex-a9-pmu", .data = armv7_a9_pmu_init},
2015 {.compatible = "arm,cortex-a8-pmu", .data = armv7_a8_pmu_init},
2016 {.compatible = "arm,cortex-a7-pmu", .data = armv7_a7_pmu_init},
2017 {.compatible = "arm,cortex-a5-pmu", .data = armv7_a5_pmu_init},
2018 {.compatible = "qcom,krait-pmu", .data = krait_pmu_init},
2019 {.compatible = "qcom,scorpion-pmu", .data = scorpion_pmu_init},
2020 {.compatible = "qcom,scorpion-mp-pmu", .data = scorpion_mp_pmu_init},
2024 static const struct pmu_probe_info armv7_pmu_probe_table[] = {
2025 ARM_PMU_PROBE(ARM_CPU_PART_CORTEX_A8, armv7_a8_pmu_init),
2026 ARM_PMU_PROBE(ARM_CPU_PART_CORTEX_A9, armv7_a9_pmu_init),
2027 { /* sentinel value */ }
2031 static int armv7_pmu_device_probe(struct platform_device *pdev)
2033 return arm_pmu_device_probe(pdev, armv7_pmu_of_device_ids,
2034 armv7_pmu_probe_table);
2037 static struct platform_driver armv7_pmu_driver = {
2039 .name = "armv7-pmu",
2040 .of_match_table = armv7_pmu_of_device_ids,
2041 .suppress_bind_attrs = true,
2043 .probe = armv7_pmu_device_probe,
2046 builtin_platform_driver(armv7_pmu_driver);
2047 #endif /* CONFIG_CPU_V7 */