2 * ARMv7 Cortex-A8 and Cortex-A9 Performance Events handling code.
4 * ARMv7 support: Jean Pihet <jpihet@mvista.com>
5 * 2010 (c) MontaVista Software, LLC.
7 * Copied from ARMv6 code, with the low level code inspired
8 * by the ARMv7 Oprofile code.
10 * Cortex-A8 has up to 4 configurable performance counters and
11 * a single cycle counter.
12 * Cortex-A9 has up to 31 configurable performance counters and
13 * a single cycle counter.
15 * All counters can be enabled/disabled and IRQ masked separately. The cycle
16 * counter and all 4 performance counters together can be reset separately.
22 * Common ARMv7 event types
24 * Note: An implementation may not be able to count all of these events
25 * but the encodings are considered to be `reserved' in the case that
26 * they are not available.
28 enum armv7_perf_types {
29 ARMV7_PERFCTR_PMNC_SW_INCR = 0x00,
30 ARMV7_PERFCTR_L1_ICACHE_REFILL = 0x01,
31 ARMV7_PERFCTR_ITLB_REFILL = 0x02,
32 ARMV7_PERFCTR_L1_DCACHE_REFILL = 0x03,
33 ARMV7_PERFCTR_L1_DCACHE_ACCESS = 0x04,
34 ARMV7_PERFCTR_DTLB_REFILL = 0x05,
35 ARMV7_PERFCTR_MEM_READ = 0x06,
36 ARMV7_PERFCTR_MEM_WRITE = 0x07,
37 ARMV7_PERFCTR_INSTR_EXECUTED = 0x08,
38 ARMV7_PERFCTR_EXC_TAKEN = 0x09,
39 ARMV7_PERFCTR_EXC_EXECUTED = 0x0A,
40 ARMV7_PERFCTR_CID_WRITE = 0x0B,
43 * ARMV7_PERFCTR_PC_WRITE is equivalent to HW_BRANCH_INSTRUCTIONS.
45 * - all (taken) branch instructions,
46 * - instructions that explicitly write the PC,
47 * - exception generating instructions.
49 ARMV7_PERFCTR_PC_WRITE = 0x0C,
50 ARMV7_PERFCTR_PC_IMM_BRANCH = 0x0D,
51 ARMV7_PERFCTR_PC_PROC_RETURN = 0x0E,
52 ARMV7_PERFCTR_MEM_UNALIGNED_ACCESS = 0x0F,
53 ARMV7_PERFCTR_PC_BRANCH_MIS_PRED = 0x10,
54 ARMV7_PERFCTR_CLOCK_CYCLES = 0x11,
55 ARMV7_PERFCTR_PC_BRANCH_PRED = 0x12,
57 /* These events are defined by the PMUv2 supplement (ARM DDI 0457A). */
58 ARMV7_PERFCTR_MEM_ACCESS = 0x13,
59 ARMV7_PERFCTR_L1_ICACHE_ACCESS = 0x14,
60 ARMV7_PERFCTR_L1_DCACHE_WB = 0x15,
61 ARMV7_PERFCTR_L2_CACHE_ACCESS = 0x16,
62 ARMV7_PERFCTR_L2_CACHE_REFILL = 0x17,
63 ARMV7_PERFCTR_L2_CACHE_WB = 0x18,
64 ARMV7_PERFCTR_BUS_ACCESS = 0x19,
65 ARMV7_PERFCTR_MEM_ERROR = 0x1A,
66 ARMV7_PERFCTR_INSTR_SPEC = 0x1B,
67 ARMV7_PERFCTR_TTBR_WRITE = 0x1C,
68 ARMV7_PERFCTR_BUS_CYCLES = 0x1D,
70 ARMV7_PERFCTR_CPU_CYCLES = 0xFF
73 /* ARMv7 Cortex-A8 specific event types */
74 enum armv7_a8_perf_types {
75 ARMV7_A8_PERFCTR_L2_CACHE_ACCESS = 0x43,
76 ARMV7_A8_PERFCTR_L2_CACHE_REFILL = 0x44,
77 ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS = 0x50,
78 ARMV7_A8_PERFCTR_STALL_ISIDE = 0x56,
81 /* ARMv7 Cortex-A9 specific event types */
82 enum armv7_a9_perf_types {
83 ARMV7_A9_PERFCTR_INSTR_CORE_RENAME = 0x68,
84 ARMV7_A9_PERFCTR_STALL_ICACHE = 0x60,
85 ARMV7_A9_PERFCTR_STALL_DISPATCH = 0x66,
88 /* ARMv7 Cortex-A5 specific event types */
89 enum armv7_a5_perf_types {
90 ARMV7_A5_PERFCTR_PREFETCH_LINEFILL = 0xc2,
91 ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP = 0xc3,
94 /* ARMv7 Cortex-A15 specific event types */
95 enum armv7_a15_perf_types {
96 ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ = 0x40,
97 ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE = 0x41,
98 ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ = 0x42,
99 ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE = 0x43,
101 ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ = 0x4C,
102 ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE = 0x4D,
104 ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ = 0x50,
105 ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE = 0x51,
106 ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ = 0x52,
107 ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE = 0x53,
109 ARMV7_A15_PERFCTR_PC_WRITE_SPEC = 0x76,
112 /* ARMv7 Cortex-A12 specific event types */
113 enum armv7_a12_perf_types {
114 ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_READ = 0x40,
115 ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_WRITE = 0x41,
117 ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_READ = 0x50,
118 ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_WRITE = 0x51,
120 ARMV7_A12_PERFCTR_PC_WRITE_SPEC = 0x76,
122 ARMV7_A12_PERFCTR_PF_TLB_REFILL = 0xe7,
126 * Cortex-A8 HW events mapping
128 * The hardware events that we support. We do support cache operations but
129 * we have harvard caches and no way to combine instruction and data
130 * accesses/misses in hardware.
132 static const unsigned armv7_a8_perf_map[PERF_COUNT_HW_MAX] = {
133 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
134 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
135 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
136 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
137 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
138 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
139 [PERF_COUNT_HW_BUS_CYCLES] = HW_OP_UNSUPPORTED,
140 [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = ARMV7_A8_PERFCTR_STALL_ISIDE,
141 [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = HW_OP_UNSUPPORTED,
144 static const unsigned armv7_a8_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
145 [PERF_COUNT_HW_CACHE_OP_MAX]
146 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
149 * The performance counters don't differentiate between read
150 * and write accesses/misses so this isn't strictly correct,
151 * but it's the best we can do. Writes and reads get
155 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
156 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
159 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
160 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
163 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
164 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
169 [C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS,
170 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
173 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
174 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
177 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
178 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
183 [C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
184 [C(RESULT_MISS)] = ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
187 [C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
188 [C(RESULT_MISS)] = ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
191 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
192 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
197 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
198 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
201 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
202 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
205 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
206 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
211 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
212 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
215 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
216 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
219 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
220 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
225 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
226 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
229 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
230 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
233 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
234 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
239 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
240 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
243 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
244 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
247 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
248 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
254 * Cortex-A9 HW events mapping
256 static const unsigned armv7_a9_perf_map[PERF_COUNT_HW_MAX] = {
257 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
258 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_A9_PERFCTR_INSTR_CORE_RENAME,
259 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
260 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
261 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
262 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
263 [PERF_COUNT_HW_BUS_CYCLES] = HW_OP_UNSUPPORTED,
264 [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = ARMV7_A9_PERFCTR_STALL_ICACHE,
265 [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = ARMV7_A9_PERFCTR_STALL_DISPATCH,
268 static const unsigned armv7_a9_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
269 [PERF_COUNT_HW_CACHE_OP_MAX]
270 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
273 * The performance counters don't differentiate between read
274 * and write accesses/misses so this isn't strictly correct,
275 * but it's the best we can do. Writes and reads get
279 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
280 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
283 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
284 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
287 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
288 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
293 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
294 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
297 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
298 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
301 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
302 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
307 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
308 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
311 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
312 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
315 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
316 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
321 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
322 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
325 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
326 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
329 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
330 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
335 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
336 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
339 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
340 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
343 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
344 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
349 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
350 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
353 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
354 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
357 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
358 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
363 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
364 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
367 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
368 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
371 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
372 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
378 * Cortex-A5 HW events mapping
380 static const unsigned armv7_a5_perf_map[PERF_COUNT_HW_MAX] = {
381 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
382 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
383 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
384 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
385 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
386 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
387 [PERF_COUNT_HW_BUS_CYCLES] = HW_OP_UNSUPPORTED,
388 [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = HW_OP_UNSUPPORTED,
389 [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = HW_OP_UNSUPPORTED,
392 static const unsigned armv7_a5_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
393 [PERF_COUNT_HW_CACHE_OP_MAX]
394 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
397 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
398 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
401 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
402 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
405 [C(RESULT_ACCESS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
406 [C(RESULT_MISS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
411 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
412 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
415 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
416 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
419 * The prefetch counters don't differentiate between the I
420 * side and the D side.
423 [C(RESULT_ACCESS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
424 [C(RESULT_MISS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
429 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
430 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
433 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
434 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
437 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
438 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
443 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
444 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
447 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
448 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
451 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
452 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
457 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
458 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
461 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
462 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
465 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
466 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
471 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
472 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
475 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
476 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
479 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
480 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
485 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
486 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
489 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
490 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
493 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
494 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
500 * Cortex-A15 HW events mapping
502 static const unsigned armv7_a15_perf_map[PERF_COUNT_HW_MAX] = {
503 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
504 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
505 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
506 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
507 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_A15_PERFCTR_PC_WRITE_SPEC,
508 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
509 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_BUS_CYCLES,
510 [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = HW_OP_UNSUPPORTED,
511 [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = HW_OP_UNSUPPORTED,
514 static const unsigned armv7_a15_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
515 [PERF_COUNT_HW_CACHE_OP_MAX]
516 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
519 [C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ,
520 [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ,
523 [C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE,
524 [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE,
527 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
528 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
533 * Not all performance counters differentiate between read
534 * and write accesses/misses so we're not always strictly
535 * correct, but it's the best we can do. Writes and reads get
536 * combined in these cases.
539 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
540 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
543 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
544 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
547 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
548 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
553 [C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ,
554 [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ,
557 [C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE,
558 [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE,
561 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
562 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
567 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
568 [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ,
571 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
572 [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE,
575 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
576 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
581 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
582 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
585 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
586 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
589 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
590 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
595 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
596 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
599 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
600 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
603 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
604 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
609 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
610 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
613 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
614 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
617 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
618 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
624 * Cortex-A7 HW events mapping
626 static const unsigned armv7_a7_perf_map[PERF_COUNT_HW_MAX] = {
627 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
628 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
629 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
630 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
631 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
632 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
633 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_BUS_CYCLES,
634 [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = HW_OP_UNSUPPORTED,
635 [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = HW_OP_UNSUPPORTED,
638 static const unsigned armv7_a7_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
639 [PERF_COUNT_HW_CACHE_OP_MAX]
640 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
643 * The performance counters don't differentiate between read
644 * and write accesses/misses so this isn't strictly correct,
645 * but it's the best we can do. Writes and reads get
649 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
650 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
653 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
654 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
657 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
658 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
663 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
664 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
667 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
668 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
671 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
672 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
677 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L2_CACHE_ACCESS,
678 [C(RESULT_MISS)] = ARMV7_PERFCTR_L2_CACHE_REFILL,
681 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L2_CACHE_ACCESS,
682 [C(RESULT_MISS)] = ARMV7_PERFCTR_L2_CACHE_REFILL,
685 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
686 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
691 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
692 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
695 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
696 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
699 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
700 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
705 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
706 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
709 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
710 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
713 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
714 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
719 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
720 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
723 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
724 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
727 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
728 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
733 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
734 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
737 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
738 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
741 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
742 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
748 * Cortex-A12 HW events mapping
750 static const unsigned armv7_a12_perf_map[PERF_COUNT_HW_MAX] = {
751 [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
752 [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
753 [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
754 [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
755 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_A12_PERFCTR_PC_WRITE_SPEC,
756 [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
757 [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_BUS_CYCLES,
758 [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = HW_OP_UNSUPPORTED,
759 [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = HW_OP_UNSUPPORTED,
762 static const unsigned armv7_a12_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
763 [PERF_COUNT_HW_CACHE_OP_MAX]
764 [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
767 [C(RESULT_ACCESS)] = ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_READ,
768 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
771 [C(RESULT_ACCESS)] = ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_WRITE,
772 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
775 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
776 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
781 * Not all performance counters differentiate between read
782 * and write accesses/misses so we're not always strictly
783 * correct, but it's the best we can do. Writes and reads get
784 * combined in these cases.
787 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
788 [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
791 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
792 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
795 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
796 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
801 [C(RESULT_ACCESS)] = ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_READ,
802 [C(RESULT_MISS)] = ARMV7_PERFCTR_L2_CACHE_REFILL,
805 [C(RESULT_ACCESS)] = ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_WRITE,
806 [C(RESULT_MISS)] = ARMV7_PERFCTR_L2_CACHE_REFILL,
809 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
810 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
815 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
816 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
819 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
820 [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
823 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
824 [C(RESULT_MISS)] = ARMV7_A12_PERFCTR_PF_TLB_REFILL,
829 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
830 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
833 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
834 [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
837 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
838 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
843 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
844 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
847 [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
848 [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
851 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
852 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
857 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
858 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
861 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
862 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
865 [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
866 [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
872 * Perf Events' indices
874 #define ARMV7_IDX_CYCLE_COUNTER 0
875 #define ARMV7_IDX_COUNTER0 1
876 #define ARMV7_IDX_COUNTER_LAST(cpu_pmu) \
877 (ARMV7_IDX_CYCLE_COUNTER + cpu_pmu->num_events - 1)
879 #define ARMV7_MAX_COUNTERS 32
880 #define ARMV7_COUNTER_MASK (ARMV7_MAX_COUNTERS - 1)
883 * ARMv7 low level PMNC access
887 * Perf Event to low level counters mapping
889 #define ARMV7_IDX_TO_COUNTER(x) \
890 (((x) - ARMV7_IDX_COUNTER0) & ARMV7_COUNTER_MASK)
893 * Per-CPU PMNC: config reg
895 #define ARMV7_PMNC_E (1 << 0) /* Enable all counters */
896 #define ARMV7_PMNC_P (1 << 1) /* Reset all counters */
897 #define ARMV7_PMNC_C (1 << 2) /* Cycle counter reset */
898 #define ARMV7_PMNC_D (1 << 3) /* CCNT counts every 64th cpu cycle */
899 #define ARMV7_PMNC_X (1 << 4) /* Export to ETM */
900 #define ARMV7_PMNC_DP (1 << 5) /* Disable CCNT if non-invasive debug*/
901 #define ARMV7_PMNC_N_SHIFT 11 /* Number of counters supported */
902 #define ARMV7_PMNC_N_MASK 0x1f
903 #define ARMV7_PMNC_MASK 0x3f /* Mask for writable bits */
906 * FLAG: counters overflow flag status reg
908 #define ARMV7_FLAG_MASK 0xffffffff /* Mask for writable bits */
909 #define ARMV7_OVERFLOWED_MASK ARMV7_FLAG_MASK
912 * PMXEVTYPER: Event selection reg
914 #define ARMV7_EVTYPE_MASK 0xc80000ff /* Mask for writable bits */
915 #define ARMV7_EVTYPE_EVENT 0xff /* Mask for EVENT bits */
918 * Event filters for PMUv2
920 #define ARMV7_EXCLUDE_PL1 (1 << 31)
921 #define ARMV7_EXCLUDE_USER (1 << 30)
922 #define ARMV7_INCLUDE_HYP (1 << 27)
924 static inline u32 armv7_pmnc_read(void)
927 asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r"(val));
931 static inline void armv7_pmnc_write(u32 val)
933 val &= ARMV7_PMNC_MASK;
935 asm volatile("mcr p15, 0, %0, c9, c12, 0" : : "r"(val));
938 static inline int armv7_pmnc_has_overflowed(u32 pmnc)
940 return pmnc & ARMV7_OVERFLOWED_MASK;
943 static inline int armv7_pmnc_counter_valid(struct arm_pmu *cpu_pmu, int idx)
945 return idx >= ARMV7_IDX_CYCLE_COUNTER &&
946 idx <= ARMV7_IDX_COUNTER_LAST(cpu_pmu);
949 static inline int armv7_pmnc_counter_has_overflowed(u32 pmnc, int idx)
951 return pmnc & BIT(ARMV7_IDX_TO_COUNTER(idx));
954 static inline int armv7_pmnc_select_counter(int idx)
956 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
957 asm volatile("mcr p15, 0, %0, c9, c12, 5" : : "r" (counter));
963 static inline u32 armv7pmu_read_counter(struct perf_event *event)
965 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
966 struct hw_perf_event *hwc = &event->hw;
970 if (!armv7_pmnc_counter_valid(cpu_pmu, idx))
971 pr_err("CPU%u reading wrong counter %d\n",
972 smp_processor_id(), idx);
973 else if (idx == ARMV7_IDX_CYCLE_COUNTER)
974 asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (value));
975 else if (armv7_pmnc_select_counter(idx) == idx)
976 asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (value));
981 static inline void armv7pmu_write_counter(struct perf_event *event, u32 value)
983 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
984 struct hw_perf_event *hwc = &event->hw;
987 if (!armv7_pmnc_counter_valid(cpu_pmu, idx))
988 pr_err("CPU%u writing wrong counter %d\n",
989 smp_processor_id(), idx);
990 else if (idx == ARMV7_IDX_CYCLE_COUNTER)
991 asm volatile("mcr p15, 0, %0, c9, c13, 0" : : "r" (value));
992 else if (armv7_pmnc_select_counter(idx) == idx)
993 asm volatile("mcr p15, 0, %0, c9, c13, 2" : : "r" (value));
996 static inline void armv7_pmnc_write_evtsel(int idx, u32 val)
998 if (armv7_pmnc_select_counter(idx) == idx) {
999 val &= ARMV7_EVTYPE_MASK;
1000 asm volatile("mcr p15, 0, %0, c9, c13, 1" : : "r" (val));
1004 static inline int armv7_pmnc_enable_counter(int idx)
1006 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
1007 asm volatile("mcr p15, 0, %0, c9, c12, 1" : : "r" (BIT(counter)));
1011 static inline int armv7_pmnc_disable_counter(int idx)
1013 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
1014 asm volatile("mcr p15, 0, %0, c9, c12, 2" : : "r" (BIT(counter)));
1018 static inline int armv7_pmnc_enable_intens(int idx)
1020 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
1021 asm volatile("mcr p15, 0, %0, c9, c14, 1" : : "r" (BIT(counter)));
1025 static inline int armv7_pmnc_disable_intens(int idx)
1027 u32 counter = ARMV7_IDX_TO_COUNTER(idx);
1028 asm volatile("mcr p15, 0, %0, c9, c14, 2" : : "r" (BIT(counter)));
1030 /* Clear the overflow flag in case an interrupt is pending. */
1031 asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (BIT(counter)));
1037 static inline u32 armv7_pmnc_getreset_flags(void)
1042 asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
1044 /* Write to clear flags */
1045 val &= ARMV7_FLAG_MASK;
1046 asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (val));
1052 static void armv7_pmnc_dump_regs(struct arm_pmu *cpu_pmu)
1057 printk(KERN_INFO "PMNC registers dump:\n");
1059 asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r" (val));
1060 printk(KERN_INFO "PMNC =0x%08x\n", val);
1062 asm volatile("mrc p15, 0, %0, c9, c12, 1" : "=r" (val));
1063 printk(KERN_INFO "CNTENS=0x%08x\n", val);
1065 asm volatile("mrc p15, 0, %0, c9, c14, 1" : "=r" (val));
1066 printk(KERN_INFO "INTENS=0x%08x\n", val);
1068 asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
1069 printk(KERN_INFO "FLAGS =0x%08x\n", val);
1071 asm volatile("mrc p15, 0, %0, c9, c12, 5" : "=r" (val));
1072 printk(KERN_INFO "SELECT=0x%08x\n", val);
1074 asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (val));
1075 printk(KERN_INFO "CCNT =0x%08x\n", val);
1077 for (cnt = ARMV7_IDX_COUNTER0;
1078 cnt <= ARMV7_IDX_COUNTER_LAST(cpu_pmu); cnt++) {
1079 armv7_pmnc_select_counter(cnt);
1080 asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (val));
1081 printk(KERN_INFO "CNT[%d] count =0x%08x\n",
1082 ARMV7_IDX_TO_COUNTER(cnt), val);
1083 asm volatile("mrc p15, 0, %0, c9, c13, 1" : "=r" (val));
1084 printk(KERN_INFO "CNT[%d] evtsel=0x%08x\n",
1085 ARMV7_IDX_TO_COUNTER(cnt), val);
1090 static void armv7pmu_save_regs(struct arm_pmu *cpu_pmu,
1091 struct cpupmu_regs *regs)
1094 asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r" (regs->pmc));
1095 if (!(regs->pmc & ARMV7_PMNC_E))
1098 asm volatile("mrc p15, 0, %0, c9, c12, 1" : "=r" (regs->pmcntenset));
1099 asm volatile("mrc p15, 0, %0, c9, c14, 0" : "=r" (regs->pmuseren));
1100 asm volatile("mrc p15, 0, %0, c9, c14, 1" : "=r" (regs->pmintenset));
1101 asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (regs->pmxevtcnt[0]));
1102 for (cnt = ARMV7_IDX_COUNTER0;
1103 cnt <= ARMV7_IDX_COUNTER_LAST(cpu_pmu); cnt++) {
1104 armv7_pmnc_select_counter(cnt);
1105 asm volatile("mrc p15, 0, %0, c9, c13, 1"
1106 : "=r"(regs->pmxevttype[cnt]));
1107 asm volatile("mrc p15, 0, %0, c9, c13, 2"
1108 : "=r"(regs->pmxevtcnt[cnt]));
1113 static void armv7pmu_restore_regs(struct arm_pmu *cpu_pmu,
1114 struct cpupmu_regs *regs)
1117 if (!(regs->pmc & ARMV7_PMNC_E))
1120 asm volatile("mcr p15, 0, %0, c9, c12, 1" : : "r" (regs->pmcntenset));
1121 asm volatile("mcr p15, 0, %0, c9, c14, 0" : : "r" (regs->pmuseren));
1122 asm volatile("mcr p15, 0, %0, c9, c14, 1" : : "r" (regs->pmintenset));
1123 asm volatile("mcr p15, 0, %0, c9, c13, 0" : : "r" (regs->pmxevtcnt[0]));
1124 for (cnt = ARMV7_IDX_COUNTER0;
1125 cnt <= ARMV7_IDX_COUNTER_LAST(cpu_pmu); cnt++) {
1126 armv7_pmnc_select_counter(cnt);
1127 asm volatile("mcr p15, 0, %0, c9, c13, 1"
1128 : : "r"(regs->pmxevttype[cnt]));
1129 asm volatile("mcr p15, 0, %0, c9, c13, 2"
1130 : : "r"(regs->pmxevtcnt[cnt]));
1132 asm volatile("mcr p15, 0, %0, c9, c12, 0" : : "r" (regs->pmc));
1135 static void armv7pmu_enable_event(struct perf_event *event)
1137 unsigned long flags;
1138 struct hw_perf_event *hwc = &event->hw;
1139 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1140 struct pmu_hw_events *events = cpu_pmu->get_hw_events();
1143 if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
1144 pr_err("CPU%u enabling wrong PMNC counter IRQ enable %d\n",
1145 smp_processor_id(), idx);
1150 * Enable counter and interrupt, and set the counter to count
1151 * the event that we're interested in.
1153 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1158 armv7_pmnc_disable_counter(idx);
1161 * Set event (if destined for PMNx counters)
1162 * We only need to set the event for the cycle counter if we
1163 * have the ability to perform event filtering.
1165 if (cpu_pmu->set_event_filter || idx != ARMV7_IDX_CYCLE_COUNTER)
1166 armv7_pmnc_write_evtsel(idx, hwc->config_base);
1169 * Enable interrupt for this counter
1171 armv7_pmnc_enable_intens(idx);
1176 armv7_pmnc_enable_counter(idx);
1178 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1181 static void armv7pmu_disable_event(struct perf_event *event)
1183 unsigned long flags;
1184 struct hw_perf_event *hwc = &event->hw;
1185 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1186 struct pmu_hw_events *events = cpu_pmu->get_hw_events();
1189 if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
1190 pr_err("CPU%u disabling wrong PMNC counter IRQ enable %d\n",
1191 smp_processor_id(), idx);
1196 * Disable counter and interrupt
1198 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1203 armv7_pmnc_disable_counter(idx);
1206 * Disable interrupt for this counter
1208 armv7_pmnc_disable_intens(idx);
1210 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1213 static irqreturn_t armv7pmu_handle_irq(int irq_num, void *dev)
1216 struct perf_sample_data data;
1217 struct arm_pmu *cpu_pmu = (struct arm_pmu *)dev;
1218 struct pmu_hw_events *cpuc = cpu_pmu->get_hw_events();
1219 struct pt_regs *regs;
1223 * Get and reset the IRQ flags
1225 pmnc = armv7_pmnc_getreset_flags();
1228 * Did an overflow occur?
1230 if (!armv7_pmnc_has_overflowed(pmnc))
1234 * Handle the counter(s) overflow(s)
1236 regs = get_irq_regs();
1238 for (idx = 0; idx < cpu_pmu->num_events; ++idx) {
1239 struct perf_event *event = cpuc->events[idx];
1240 struct hw_perf_event *hwc;
1242 /* Ignore if we don't have an event. */
1247 * We have a single interrupt for all counters. Check that
1248 * each counter has overflowed before we process it.
1250 if (!armv7_pmnc_counter_has_overflowed(pmnc, idx))
1254 armpmu_event_update(event);
1255 perf_sample_data_init(&data, 0, hwc->last_period);
1256 if (!armpmu_event_set_period(event))
1259 if (perf_event_overflow(event, &data, regs))
1260 cpu_pmu->disable(event);
1264 * Handle the pending perf events.
1266 * Note: this call *must* be run with interrupts disabled. For
1267 * platforms that can have the PMU interrupts raised as an NMI, this
1275 static void armv7pmu_start(struct arm_pmu *cpu_pmu)
1277 unsigned long flags;
1278 struct pmu_hw_events *events = cpu_pmu->get_hw_events();
1280 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1281 /* Enable all counters */
1282 armv7_pmnc_write(armv7_pmnc_read() | ARMV7_PMNC_E);
1283 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1286 static void armv7pmu_stop(struct arm_pmu *cpu_pmu)
1288 unsigned long flags;
1289 struct pmu_hw_events *events = cpu_pmu->get_hw_events();
1291 raw_spin_lock_irqsave(&events->pmu_lock, flags);
1292 /* Disable all counters */
1293 armv7_pmnc_write(armv7_pmnc_read() & ~ARMV7_PMNC_E);
1294 raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1297 static int armv7pmu_get_event_idx(struct pmu_hw_events *cpuc,
1298 struct perf_event *event)
1301 struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1302 struct hw_perf_event *hwc = &event->hw;
1303 unsigned long evtype = hwc->config_base & ARMV7_EVTYPE_EVENT;
1305 /* Always place a cycle counter into the cycle counter. */
1306 if (evtype == ARMV7_PERFCTR_CPU_CYCLES) {
1307 if (test_and_set_bit(ARMV7_IDX_CYCLE_COUNTER, cpuc->used_mask))
1310 return ARMV7_IDX_CYCLE_COUNTER;
1314 * For anything other than a cycle counter, try and use
1315 * the events counters
1317 for (idx = ARMV7_IDX_COUNTER0; idx < cpu_pmu->num_events; ++idx) {
1318 if (!test_and_set_bit(idx, cpuc->used_mask))
1322 /* The counters are all in use. */
1327 * Add an event filter to a given event. This will only work for PMUv2 PMUs.
1329 static int armv7pmu_set_event_filter(struct hw_perf_event *event,
1330 struct perf_event_attr *attr)
1332 unsigned long config_base = 0;
1334 if (attr->exclude_idle)
1336 if (attr->exclude_user)
1337 config_base |= ARMV7_EXCLUDE_USER;
1338 if (attr->exclude_kernel)
1339 config_base |= ARMV7_EXCLUDE_PL1;
1340 if (!attr->exclude_hv)
1341 config_base |= ARMV7_INCLUDE_HYP;
1344 * Install the filter into config_base as this is used to
1345 * construct the event type.
1347 event->config_base = config_base;
1352 static void armv7pmu_reset(void *info)
1354 struct arm_pmu *cpu_pmu = (struct arm_pmu *)info;
1355 u32 idx, nb_cnt = cpu_pmu->num_events;
1357 /* The counter and interrupt enable registers are unknown at reset. */
1358 for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1359 armv7_pmnc_disable_counter(idx);
1360 armv7_pmnc_disable_intens(idx);
1363 /* Initialize & Reset PMNC: C and P bits */
1364 armv7_pmnc_write(ARMV7_PMNC_P | ARMV7_PMNC_C);
1367 static int armv7_a8_map_event(struct perf_event *event)
1369 return armpmu_map_event(event, &armv7_a8_perf_map,
1370 &armv7_a8_perf_cache_map, 0xFF);
1373 static int armv7_a9_map_event(struct perf_event *event)
1375 return armpmu_map_event(event, &armv7_a9_perf_map,
1376 &armv7_a9_perf_cache_map, 0xFF);
1379 static int armv7_a5_map_event(struct perf_event *event)
1381 return armpmu_map_event(event, &armv7_a5_perf_map,
1382 &armv7_a5_perf_cache_map, 0xFF);
1385 static int armv7_a15_map_event(struct perf_event *event)
1387 return armpmu_map_event(event, &armv7_a15_perf_map,
1388 &armv7_a15_perf_cache_map, 0xFF);
1391 static int armv7_a7_map_event(struct perf_event *event)
1393 return armpmu_map_event(event, &armv7_a7_perf_map,
1394 &armv7_a7_perf_cache_map, 0xFF);
1397 static int armv7_a12_map_event(struct perf_event *event)
1399 return armpmu_map_event(event, &armv7_a12_perf_map,
1400 &armv7_a12_perf_cache_map, 0xFF);
1403 static void armv7pmu_init(struct arm_pmu *cpu_pmu)
1405 cpu_pmu->handle_irq = armv7pmu_handle_irq;
1406 cpu_pmu->enable = armv7pmu_enable_event;
1407 cpu_pmu->disable = armv7pmu_disable_event;
1408 cpu_pmu->read_counter = armv7pmu_read_counter;
1409 cpu_pmu->write_counter = armv7pmu_write_counter;
1410 cpu_pmu->get_event_idx = armv7pmu_get_event_idx;
1411 cpu_pmu->start = armv7pmu_start;
1412 cpu_pmu->stop = armv7pmu_stop;
1413 cpu_pmu->reset = armv7pmu_reset;
1414 cpu_pmu->save_regs = armv7pmu_save_regs;
1415 cpu_pmu->restore_regs = armv7pmu_restore_regs;
1416 cpu_pmu->max_period = (1LLU << 32) - 1;
1419 static u32 armv7_read_num_pmnc_events(void)
1423 /* Read the nb of CNTx counters supported from PMNC */
1424 nb_cnt = (armv7_pmnc_read() >> ARMV7_PMNC_N_SHIFT) & ARMV7_PMNC_N_MASK;
1426 /* Add the CPU cycles counter and return */
1430 static int armv7_a8_pmu_init(struct arm_pmu *cpu_pmu)
1432 armv7pmu_init(cpu_pmu);
1433 cpu_pmu->name = "ARMv7_Cortex_A8";
1434 cpu_pmu->map_event = armv7_a8_map_event;
1435 cpu_pmu->num_events = armv7_read_num_pmnc_events();
1439 static int armv7_a9_pmu_init(struct arm_pmu *cpu_pmu)
1441 armv7pmu_init(cpu_pmu);
1442 cpu_pmu->name = "ARMv7_Cortex_A9";
1443 cpu_pmu->map_event = armv7_a9_map_event;
1444 cpu_pmu->num_events = armv7_read_num_pmnc_events();
1448 static int armv7_a5_pmu_init(struct arm_pmu *cpu_pmu)
1450 armv7pmu_init(cpu_pmu);
1451 cpu_pmu->name = "ARMv7_Cortex_A5";
1452 cpu_pmu->map_event = armv7_a5_map_event;
1453 cpu_pmu->num_events = armv7_read_num_pmnc_events();
1457 static int armv7_a15_pmu_init(struct arm_pmu *cpu_pmu)
1459 armv7pmu_init(cpu_pmu);
1460 cpu_pmu->name = "ARMv7_Cortex_A15";
1461 cpu_pmu->map_event = armv7_a15_map_event;
1462 cpu_pmu->num_events = armv7_read_num_pmnc_events();
1463 cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1467 static int armv7_a7_pmu_init(struct arm_pmu *cpu_pmu)
1469 armv7pmu_init(cpu_pmu);
1470 cpu_pmu->name = "ARMv7_Cortex_A7";
1471 cpu_pmu->map_event = armv7_a7_map_event;
1472 cpu_pmu->num_events = armv7_read_num_pmnc_events();
1473 cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1477 static int armv7_a12_pmu_init(struct arm_pmu *cpu_pmu)
1479 armv7pmu_init(cpu_pmu);
1480 cpu_pmu->name = "ARMv7 Cortex-A12";
1481 cpu_pmu->map_event = armv7_a12_map_event;
1482 cpu_pmu->num_events = armv7_read_num_pmnc_events();
1483 cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1487 static inline int armv7_a8_pmu_init(struct arm_pmu *cpu_pmu)
1492 static inline int armv7_a9_pmu_init(struct arm_pmu *cpu_pmu)
1497 static inline int armv7_a5_pmu_init(struct arm_pmu *cpu_pmu)
1502 static inline int armv7_a15_pmu_init(struct arm_pmu *cpu_pmu)
1507 static inline int armv7_a7_pmu_init(struct arm_pmu *cpu_pmu)
1512 static inline int armv7_a12_pmu_init(struct arm_pmu *cpu_pmu)
1516 #endif /* CONFIG_CPU_V7 */