2 * ARMv7 Cortex-A8 and Cortex-A9 Performance Events handling code.
4 * ARMv7 support: Jean Pihet <jpihet@mvista.com>
5 * 2010 (c) MontaVista Software, LLC.
7 * Copied from ARMv6 code, with the low level code inspired
8 * by the ARMv7 Oprofile code.
10 * Cortex-A8 has up to 4 configurable performance counters and
11 * a single cycle counter.
12 * Cortex-A9 has up to 31 configurable performance counters and
13 * a single cycle counter.
15 * All counters can be enabled/disabled and IRQ masked separately. The cycle
16 * counter and all 4 performance counters together can be reset separately.
21 * Common ARMv7 event types
23 * Note: An implementation may not be able to count all of these events
24 * but the encodings are considered to be `reserved' in the case that
25 * they are not available.
27 enum armv7_perf_types
{
28 ARMV7_PERFCTR_PMNC_SW_INCR
= 0x00,
29 ARMV7_PERFCTR_IFETCH_MISS
= 0x01,
30 ARMV7_PERFCTR_ITLB_MISS
= 0x02,
31 ARMV7_PERFCTR_DCACHE_REFILL
= 0x03, /* L1 */
32 ARMV7_PERFCTR_DCACHE_ACCESS
= 0x04, /* L1 */
33 ARMV7_PERFCTR_DTLB_REFILL
= 0x05,
34 ARMV7_PERFCTR_DREAD
= 0x06,
35 ARMV7_PERFCTR_DWRITE
= 0x07,
36 ARMV7_PERFCTR_INSTR_EXECUTED
= 0x08,
37 ARMV7_PERFCTR_EXC_TAKEN
= 0x09,
38 ARMV7_PERFCTR_EXC_EXECUTED
= 0x0A,
39 ARMV7_PERFCTR_CID_WRITE
= 0x0B,
40 /* ARMV7_PERFCTR_PC_WRITE is equivalent to HW_BRANCH_INSTRUCTIONS.
42 * - all branch instructions,
43 * - instructions that explicitly write the PC,
44 * - exception generating instructions.
46 ARMV7_PERFCTR_PC_WRITE
= 0x0C,
47 ARMV7_PERFCTR_PC_IMM_BRANCH
= 0x0D,
48 ARMV7_PERFCTR_PC_PROC_RETURN
= 0x0E,
49 ARMV7_PERFCTR_UNALIGNED_ACCESS
= 0x0F,
51 /* These events are defined by the PMUv2 supplement (ARM DDI 0457A). */
52 ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
= 0x10,
53 ARMV7_PERFCTR_CLOCK_CYCLES
= 0x11,
54 ARMV7_PERFCTR_PC_BRANCH_PRED
= 0x12,
55 ARMV7_PERFCTR_MEM_ACCESS
= 0x13,
56 ARMV7_PERFCTR_L1_ICACHE_ACCESS
= 0x14,
57 ARMV7_PERFCTR_L1_DCACHE_WB
= 0x15,
58 ARMV7_PERFCTR_L2_DCACHE_ACCESS
= 0x16,
59 ARMV7_PERFCTR_L2_DCACHE_REFILL
= 0x17,
60 ARMV7_PERFCTR_L2_DCACHE_WB
= 0x18,
61 ARMV7_PERFCTR_BUS_ACCESS
= 0x19,
62 ARMV7_PERFCTR_MEMORY_ERROR
= 0x1A,
63 ARMV7_PERFCTR_INSTR_SPEC
= 0x1B,
64 ARMV7_PERFCTR_TTBR_WRITE
= 0x1C,
65 ARMV7_PERFCTR_BUS_CYCLES
= 0x1D,
67 ARMV7_PERFCTR_CPU_CYCLES
= 0xFF
70 /* ARMv7 Cortex-A8 specific event types */
71 enum armv7_a8_perf_types
{
72 ARMV7_PERFCTR_WRITE_BUFFER_FULL
= 0x40,
73 ARMV7_PERFCTR_L2_STORE_MERGED
= 0x41,
74 ARMV7_PERFCTR_L2_STORE_BUFF
= 0x42,
75 ARMV7_PERFCTR_L2_ACCESS
= 0x43,
76 ARMV7_PERFCTR_L2_CACH_MISS
= 0x44,
77 ARMV7_PERFCTR_AXI_READ_CYCLES
= 0x45,
78 ARMV7_PERFCTR_AXI_WRITE_CYCLES
= 0x46,
79 ARMV7_PERFCTR_MEMORY_REPLAY
= 0x47,
80 ARMV7_PERFCTR_UNALIGNED_ACCESS_REPLAY
= 0x48,
81 ARMV7_PERFCTR_L1_DATA_MISS
= 0x49,
82 ARMV7_PERFCTR_L1_INST_MISS
= 0x4A,
83 ARMV7_PERFCTR_L1_DATA_COLORING
= 0x4B,
84 ARMV7_PERFCTR_L1_NEON_DATA
= 0x4C,
85 ARMV7_PERFCTR_L1_NEON_CACH_DATA
= 0x4D,
86 ARMV7_PERFCTR_L2_NEON
= 0x4E,
87 ARMV7_PERFCTR_L2_NEON_HIT
= 0x4F,
88 ARMV7_PERFCTR_L1_INST
= 0x50,
89 ARMV7_PERFCTR_PC_RETURN_MIS_PRED
= 0x51,
90 ARMV7_PERFCTR_PC_BRANCH_FAILED
= 0x52,
91 ARMV7_PERFCTR_PC_BRANCH_TAKEN
= 0x53,
92 ARMV7_PERFCTR_PC_BRANCH_EXECUTED
= 0x54,
93 ARMV7_PERFCTR_OP_EXECUTED
= 0x55,
94 ARMV7_PERFCTR_CYCLES_INST_STALL
= 0x56,
95 ARMV7_PERFCTR_CYCLES_INST
= 0x57,
96 ARMV7_PERFCTR_CYCLES_NEON_DATA_STALL
= 0x58,
97 ARMV7_PERFCTR_CYCLES_NEON_INST_STALL
= 0x59,
98 ARMV7_PERFCTR_NEON_CYCLES
= 0x5A,
100 ARMV7_PERFCTR_PMU0_EVENTS
= 0x70,
101 ARMV7_PERFCTR_PMU1_EVENTS
= 0x71,
102 ARMV7_PERFCTR_PMU_EVENTS
= 0x72,
105 /* ARMv7 Cortex-A9 specific event types */
106 enum armv7_a9_perf_types
{
107 ARMV7_PERFCTR_JAVA_HW_BYTECODE_EXEC
= 0x40,
108 ARMV7_PERFCTR_JAVA_SW_BYTECODE_EXEC
= 0x41,
109 ARMV7_PERFCTR_JAZELLE_BRANCH_EXEC
= 0x42,
111 ARMV7_PERFCTR_COHERENT_LINE_MISS
= 0x50,
112 ARMV7_PERFCTR_COHERENT_LINE_HIT
= 0x51,
114 ARMV7_PERFCTR_ICACHE_DEP_STALL_CYCLES
= 0x60,
115 ARMV7_PERFCTR_DCACHE_DEP_STALL_CYCLES
= 0x61,
116 ARMV7_PERFCTR_TLB_MISS_DEP_STALL_CYCLES
= 0x62,
117 ARMV7_PERFCTR_STREX_EXECUTED_PASSED
= 0x63,
118 ARMV7_PERFCTR_STREX_EXECUTED_FAILED
= 0x64,
119 ARMV7_PERFCTR_DATA_EVICTION
= 0x65,
120 ARMV7_PERFCTR_ISSUE_STAGE_NO_INST
= 0x66,
121 ARMV7_PERFCTR_ISSUE_STAGE_EMPTY
= 0x67,
122 ARMV7_PERFCTR_INST_OUT_OF_RENAME_STAGE
= 0x68,
124 ARMV7_PERFCTR_PREDICTABLE_FUNCT_RETURNS
= 0x6E,
126 ARMV7_PERFCTR_MAIN_UNIT_EXECUTED_INST
= 0x70,
127 ARMV7_PERFCTR_SECOND_UNIT_EXECUTED_INST
= 0x71,
128 ARMV7_PERFCTR_LD_ST_UNIT_EXECUTED_INST
= 0x72,
129 ARMV7_PERFCTR_FP_EXECUTED_INST
= 0x73,
130 ARMV7_PERFCTR_NEON_EXECUTED_INST
= 0x74,
132 ARMV7_PERFCTR_PLD_FULL_DEP_STALL_CYCLES
= 0x80,
133 ARMV7_PERFCTR_DATA_WR_DEP_STALL_CYCLES
= 0x81,
134 ARMV7_PERFCTR_ITLB_MISS_DEP_STALL_CYCLES
= 0x82,
135 ARMV7_PERFCTR_DTLB_MISS_DEP_STALL_CYCLES
= 0x83,
136 ARMV7_PERFCTR_MICRO_ITLB_MISS_DEP_STALL_CYCLES
= 0x84,
137 ARMV7_PERFCTR_MICRO_DTLB_MISS_DEP_STALL_CYCLES
= 0x85,
138 ARMV7_PERFCTR_DMB_DEP_STALL_CYCLES
= 0x86,
140 ARMV7_PERFCTR_INTGR_CLK_ENABLED_CYCLES
= 0x8A,
141 ARMV7_PERFCTR_DATA_ENGINE_CLK_EN_CYCLES
= 0x8B,
143 ARMV7_PERFCTR_ISB_INST
= 0x90,
144 ARMV7_PERFCTR_DSB_INST
= 0x91,
145 ARMV7_PERFCTR_DMB_INST
= 0x92,
146 ARMV7_PERFCTR_EXT_INTERRUPTS
= 0x93,
148 ARMV7_PERFCTR_PLE_CACHE_LINE_RQST_COMPLETED
= 0xA0,
149 ARMV7_PERFCTR_PLE_CACHE_LINE_RQST_SKIPPED
= 0xA1,
150 ARMV7_PERFCTR_PLE_FIFO_FLUSH
= 0xA2,
151 ARMV7_PERFCTR_PLE_RQST_COMPLETED
= 0xA3,
152 ARMV7_PERFCTR_PLE_FIFO_OVERFLOW
= 0xA4,
153 ARMV7_PERFCTR_PLE_RQST_PROG
= 0xA5
156 /* ARMv7 Cortex-A5 specific event types */
157 enum armv7_a5_perf_types
{
158 ARMV7_PERFCTR_IRQ_TAKEN
= 0x86,
159 ARMV7_PERFCTR_FIQ_TAKEN
= 0x87,
161 ARMV7_PERFCTR_EXT_MEM_RQST
= 0xc0,
162 ARMV7_PERFCTR_NC_EXT_MEM_RQST
= 0xc1,
163 ARMV7_PERFCTR_PREFETCH_LINEFILL
= 0xc2,
164 ARMV7_PERFCTR_PREFETCH_LINEFILL_DROP
= 0xc3,
165 ARMV7_PERFCTR_ENTER_READ_ALLOC
= 0xc4,
166 ARMV7_PERFCTR_READ_ALLOC
= 0xc5,
168 ARMV7_PERFCTR_STALL_SB_FULL
= 0xc9,
172 * Cortex-A8 HW events mapping
174 * The hardware events that we support. We do support cache operations but
175 * we have harvard caches and no way to combine instruction and data
176 * accesses/misses in hardware.
178 static const unsigned armv7_a8_perf_map
[PERF_COUNT_HW_MAX
] = {
179 [PERF_COUNT_HW_CPU_CYCLES
] = ARMV7_PERFCTR_CPU_CYCLES
,
180 [PERF_COUNT_HW_INSTRUCTIONS
] = ARMV7_PERFCTR_INSTR_EXECUTED
,
181 [PERF_COUNT_HW_CACHE_REFERENCES
] = HW_OP_UNSUPPORTED
,
182 [PERF_COUNT_HW_CACHE_MISSES
] = HW_OP_UNSUPPORTED
,
183 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS
] = ARMV7_PERFCTR_PC_WRITE
,
184 [PERF_COUNT_HW_BRANCH_MISSES
] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
185 [PERF_COUNT_HW_BUS_CYCLES
] = ARMV7_PERFCTR_CLOCK_CYCLES
,
188 static const unsigned armv7_a8_perf_cache_map
[PERF_COUNT_HW_CACHE_MAX
]
189 [PERF_COUNT_HW_CACHE_OP_MAX
]
190 [PERF_COUNT_HW_CACHE_RESULT_MAX
] = {
193 * The performance counters don't differentiate between read
194 * and write accesses/misses so this isn't strictly correct,
195 * but it's the best we can do. Writes and reads get
199 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_DCACHE_ACCESS
,
200 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DCACHE_REFILL
,
203 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_DCACHE_ACCESS
,
204 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DCACHE_REFILL
,
207 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
208 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
213 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_L1_INST
,
214 [C(RESULT_MISS
)] = ARMV7_PERFCTR_L1_INST_MISS
,
217 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_L1_INST
,
218 [C(RESULT_MISS
)] = ARMV7_PERFCTR_L1_INST_MISS
,
221 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
222 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
227 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_L2_ACCESS
,
228 [C(RESULT_MISS
)] = ARMV7_PERFCTR_L2_CACH_MISS
,
231 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_L2_ACCESS
,
232 [C(RESULT_MISS
)] = ARMV7_PERFCTR_L2_CACH_MISS
,
235 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
236 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
241 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
242 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DTLB_REFILL
,
245 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
246 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DTLB_REFILL
,
249 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
250 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
255 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
256 [C(RESULT_MISS
)] = ARMV7_PERFCTR_ITLB_MISS
,
259 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
260 [C(RESULT_MISS
)] = ARMV7_PERFCTR_ITLB_MISS
,
263 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
264 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
269 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_PC_WRITE
,
271 = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
274 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_PC_WRITE
,
276 = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
279 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
280 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
286 * Cortex-A9 HW events mapping
288 static const unsigned armv7_a9_perf_map
[PERF_COUNT_HW_MAX
] = {
289 [PERF_COUNT_HW_CPU_CYCLES
] = ARMV7_PERFCTR_CPU_CYCLES
,
290 [PERF_COUNT_HW_INSTRUCTIONS
] =
291 ARMV7_PERFCTR_INST_OUT_OF_RENAME_STAGE
,
292 [PERF_COUNT_HW_CACHE_REFERENCES
] = ARMV7_PERFCTR_COHERENT_LINE_HIT
,
293 [PERF_COUNT_HW_CACHE_MISSES
] = ARMV7_PERFCTR_COHERENT_LINE_MISS
,
294 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS
] = ARMV7_PERFCTR_PC_WRITE
,
295 [PERF_COUNT_HW_BRANCH_MISSES
] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
296 [PERF_COUNT_HW_BUS_CYCLES
] = ARMV7_PERFCTR_CLOCK_CYCLES
,
299 static const unsigned armv7_a9_perf_cache_map
[PERF_COUNT_HW_CACHE_MAX
]
300 [PERF_COUNT_HW_CACHE_OP_MAX
]
301 [PERF_COUNT_HW_CACHE_RESULT_MAX
] = {
304 * The performance counters don't differentiate between read
305 * and write accesses/misses so this isn't strictly correct,
306 * but it's the best we can do. Writes and reads get
310 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_DCACHE_ACCESS
,
311 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DCACHE_REFILL
,
314 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_DCACHE_ACCESS
,
315 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DCACHE_REFILL
,
318 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
319 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
324 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
325 [C(RESULT_MISS
)] = ARMV7_PERFCTR_IFETCH_MISS
,
328 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
329 [C(RESULT_MISS
)] = ARMV7_PERFCTR_IFETCH_MISS
,
332 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
333 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
338 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
339 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
342 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
343 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
346 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
347 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
352 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
353 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DTLB_REFILL
,
356 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
357 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DTLB_REFILL
,
360 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
361 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
366 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
367 [C(RESULT_MISS
)] = ARMV7_PERFCTR_ITLB_MISS
,
370 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
371 [C(RESULT_MISS
)] = ARMV7_PERFCTR_ITLB_MISS
,
374 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
375 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
380 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_PC_WRITE
,
382 = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
385 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_PC_WRITE
,
387 = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
390 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
391 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
397 * Cortex-A5 HW events mapping
399 static const unsigned armv7_a5_perf_map
[PERF_COUNT_HW_MAX
] = {
400 [PERF_COUNT_HW_CPU_CYCLES
] = ARMV7_PERFCTR_CPU_CYCLES
,
401 [PERF_COUNT_HW_INSTRUCTIONS
] = ARMV7_PERFCTR_INSTR_EXECUTED
,
402 [PERF_COUNT_HW_CACHE_REFERENCES
] = HW_OP_UNSUPPORTED
,
403 [PERF_COUNT_HW_CACHE_MISSES
] = HW_OP_UNSUPPORTED
,
404 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS
] = ARMV7_PERFCTR_PC_WRITE
,
405 [PERF_COUNT_HW_BRANCH_MISSES
] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
406 [PERF_COUNT_HW_BUS_CYCLES
] = HW_OP_UNSUPPORTED
,
409 static const unsigned armv7_a5_perf_cache_map
[PERF_COUNT_HW_CACHE_MAX
]
410 [PERF_COUNT_HW_CACHE_OP_MAX
]
411 [PERF_COUNT_HW_CACHE_RESULT_MAX
] = {
415 = ARMV7_PERFCTR_DCACHE_ACCESS
,
417 = ARMV7_PERFCTR_DCACHE_REFILL
,
421 = ARMV7_PERFCTR_DCACHE_ACCESS
,
423 = ARMV7_PERFCTR_DCACHE_REFILL
,
427 = ARMV7_PERFCTR_PREFETCH_LINEFILL
,
429 = ARMV7_PERFCTR_PREFETCH_LINEFILL_DROP
,
434 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS
,
435 [C(RESULT_MISS
)] = ARMV7_PERFCTR_IFETCH_MISS
,
438 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS
,
439 [C(RESULT_MISS
)] = ARMV7_PERFCTR_IFETCH_MISS
,
442 * The prefetch counters don't differentiate between the I
443 * side and the D side.
447 = ARMV7_PERFCTR_PREFETCH_LINEFILL
,
449 = ARMV7_PERFCTR_PREFETCH_LINEFILL_DROP
,
454 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
455 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
458 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
459 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
462 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
463 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
468 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
469 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DTLB_REFILL
,
472 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
473 [C(RESULT_MISS
)] = ARMV7_PERFCTR_DTLB_REFILL
,
476 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
477 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
482 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
483 [C(RESULT_MISS
)] = ARMV7_PERFCTR_ITLB_MISS
,
486 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
487 [C(RESULT_MISS
)] = ARMV7_PERFCTR_ITLB_MISS
,
490 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
491 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
496 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_PC_BRANCH_PRED
,
498 = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
501 [C(RESULT_ACCESS
)] = ARMV7_PERFCTR_PC_BRANCH_PRED
,
503 = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED
,
506 [C(RESULT_ACCESS
)] = CACHE_OP_UNSUPPORTED
,
507 [C(RESULT_MISS
)] = CACHE_OP_UNSUPPORTED
,
513 * Perf Events counters
515 enum armv7_counters
{
516 ARMV7_CYCLE_COUNTER
= 1, /* Cycle counter */
517 ARMV7_COUNTER0
= 2, /* First event counter */
521 * The cycle counter is ARMV7_CYCLE_COUNTER.
522 * The first event counter is ARMV7_COUNTER0.
523 * The last event counter is (ARMV7_COUNTER0 + armpmu->num_events - 1).
525 #define ARMV7_COUNTER_LAST (ARMV7_COUNTER0 + armpmu->num_events - 1)
528 * ARMv7 low level PMNC access
532 * Per-CPU PMNC: config reg
534 #define ARMV7_PMNC_E (1 << 0) /* Enable all counters */
535 #define ARMV7_PMNC_P (1 << 1) /* Reset all counters */
536 #define ARMV7_PMNC_C (1 << 2) /* Cycle counter reset */
537 #define ARMV7_PMNC_D (1 << 3) /* CCNT counts every 64th cpu cycle */
538 #define ARMV7_PMNC_X (1 << 4) /* Export to ETM */
539 #define ARMV7_PMNC_DP (1 << 5) /* Disable CCNT if non-invasive debug*/
540 #define ARMV7_PMNC_N_SHIFT 11 /* Number of counters supported */
541 #define ARMV7_PMNC_N_MASK 0x1f
542 #define ARMV7_PMNC_MASK 0x3f /* Mask for writable bits */
547 #define ARMV7_CNT0 0 /* First event counter */
548 #define ARMV7_CCNT 31 /* Cycle counter */
550 /* Perf Event to low level counters mapping */
551 #define ARMV7_EVENT_CNT_TO_CNTx (ARMV7_COUNTER0 - ARMV7_CNT0)
554 * CNTENS: counters enable reg
556 #define ARMV7_CNTENS_P(idx) (1 << (idx - ARMV7_EVENT_CNT_TO_CNTx))
557 #define ARMV7_CNTENS_C (1 << ARMV7_CCNT)
560 * CNTENC: counters disable reg
562 #define ARMV7_CNTENC_P(idx) (1 << (idx - ARMV7_EVENT_CNT_TO_CNTx))
563 #define ARMV7_CNTENC_C (1 << ARMV7_CCNT)
566 * INTENS: counters overflow interrupt enable reg
568 #define ARMV7_INTENS_P(idx) (1 << (idx - ARMV7_EVENT_CNT_TO_CNTx))
569 #define ARMV7_INTENS_C (1 << ARMV7_CCNT)
572 * INTENC: counters overflow interrupt disable reg
574 #define ARMV7_INTENC_P(idx) (1 << (idx - ARMV7_EVENT_CNT_TO_CNTx))
575 #define ARMV7_INTENC_C (1 << ARMV7_CCNT)
578 * EVTSEL: Event selection reg
580 #define ARMV7_EVTSEL_MASK 0xff /* Mask for writable bits */
583 * SELECT: Counter selection reg
585 #define ARMV7_SELECT_MASK 0x1f /* Mask for writable bits */
588 * FLAG: counters overflow flag status reg
590 #define ARMV7_FLAG_P(idx) (1 << (idx - ARMV7_EVENT_CNT_TO_CNTx))
591 #define ARMV7_FLAG_C (1 << ARMV7_CCNT)
592 #define ARMV7_FLAG_MASK 0xffffffff /* Mask for writable bits */
593 #define ARMV7_OVERFLOWED_MASK ARMV7_FLAG_MASK
595 static inline unsigned long armv7_pmnc_read(void)
598 asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r"(val
));
602 static inline void armv7_pmnc_write(unsigned long val
)
604 val
&= ARMV7_PMNC_MASK
;
606 asm volatile("mcr p15, 0, %0, c9, c12, 0" : : "r"(val
));
609 static inline int armv7_pmnc_has_overflowed(unsigned long pmnc
)
611 return pmnc
& ARMV7_OVERFLOWED_MASK
;
614 static inline int armv7_pmnc_counter_has_overflowed(unsigned long pmnc
,
615 enum armv7_counters counter
)
619 if (counter
== ARMV7_CYCLE_COUNTER
)
620 ret
= pmnc
& ARMV7_FLAG_C
;
621 else if ((counter
>= ARMV7_COUNTER0
) && (counter
<= ARMV7_COUNTER_LAST
))
622 ret
= pmnc
& ARMV7_FLAG_P(counter
);
624 pr_err("CPU%u checking wrong counter %d overflow status\n",
625 smp_processor_id(), counter
);
630 static inline int armv7_pmnc_select_counter(unsigned int idx
)
634 if ((idx
< ARMV7_COUNTER0
) || (idx
> ARMV7_COUNTER_LAST
)) {
635 pr_err("CPU%u selecting wrong PMNC counter"
636 " %d\n", smp_processor_id(), idx
);
640 val
= (idx
- ARMV7_EVENT_CNT_TO_CNTx
) & ARMV7_SELECT_MASK
;
641 asm volatile("mcr p15, 0, %0, c9, c12, 5" : : "r" (val
));
647 static inline u32
armv7pmu_read_counter(int idx
)
649 unsigned long value
= 0;
651 if (idx
== ARMV7_CYCLE_COUNTER
)
652 asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (value
));
653 else if ((idx
>= ARMV7_COUNTER0
) && (idx
<= ARMV7_COUNTER_LAST
)) {
654 if (armv7_pmnc_select_counter(idx
) == idx
)
655 asm volatile("mrc p15, 0, %0, c9, c13, 2"
658 pr_err("CPU%u reading wrong counter %d\n",
659 smp_processor_id(), idx
);
664 static inline void armv7pmu_write_counter(int idx
, u32 value
)
666 if (idx
== ARMV7_CYCLE_COUNTER
)
667 asm volatile("mcr p15, 0, %0, c9, c13, 0" : : "r" (value
));
668 else if ((idx
>= ARMV7_COUNTER0
) && (idx
<= ARMV7_COUNTER_LAST
)) {
669 if (armv7_pmnc_select_counter(idx
) == idx
)
670 asm volatile("mcr p15, 0, %0, c9, c13, 2"
673 pr_err("CPU%u writing wrong counter %d\n",
674 smp_processor_id(), idx
);
677 static inline void armv7_pmnc_write_evtsel(unsigned int idx
, u32 val
)
679 if (armv7_pmnc_select_counter(idx
) == idx
) {
680 val
&= ARMV7_EVTSEL_MASK
;
681 asm volatile("mcr p15, 0, %0, c9, c13, 1" : : "r" (val
));
685 static inline u32
armv7_pmnc_enable_counter(unsigned int idx
)
689 if ((idx
!= ARMV7_CYCLE_COUNTER
) &&
690 ((idx
< ARMV7_COUNTER0
) || (idx
> ARMV7_COUNTER_LAST
))) {
691 pr_err("CPU%u enabling wrong PMNC counter"
692 " %d\n", smp_processor_id(), idx
);
696 if (idx
== ARMV7_CYCLE_COUNTER
)
697 val
= ARMV7_CNTENS_C
;
699 val
= ARMV7_CNTENS_P(idx
);
701 asm volatile("mcr p15, 0, %0, c9, c12, 1" : : "r" (val
));
706 static inline u32
armv7_pmnc_disable_counter(unsigned int idx
)
711 if ((idx
!= ARMV7_CYCLE_COUNTER
) &&
712 ((idx
< ARMV7_COUNTER0
) || (idx
> ARMV7_COUNTER_LAST
))) {
713 pr_err("CPU%u disabling wrong PMNC counter"
714 " %d\n", smp_processor_id(), idx
);
718 if (idx
== ARMV7_CYCLE_COUNTER
)
719 val
= ARMV7_CNTENC_C
;
721 val
= ARMV7_CNTENC_P(idx
);
723 asm volatile("mcr p15, 0, %0, c9, c12, 2" : : "r" (val
));
728 static inline u32
armv7_pmnc_enable_intens(unsigned int idx
)
732 if ((idx
!= ARMV7_CYCLE_COUNTER
) &&
733 ((idx
< ARMV7_COUNTER0
) || (idx
> ARMV7_COUNTER_LAST
))) {
734 pr_err("CPU%u enabling wrong PMNC counter"
735 " interrupt enable %d\n", smp_processor_id(), idx
);
739 if (idx
== ARMV7_CYCLE_COUNTER
)
740 val
= ARMV7_INTENS_C
;
742 val
= ARMV7_INTENS_P(idx
);
744 asm volatile("mcr p15, 0, %0, c9, c14, 1" : : "r" (val
));
749 static inline u32
armv7_pmnc_disable_intens(unsigned int idx
)
753 if ((idx
!= ARMV7_CYCLE_COUNTER
) &&
754 ((idx
< ARMV7_COUNTER0
) || (idx
> ARMV7_COUNTER_LAST
))) {
755 pr_err("CPU%u disabling wrong PMNC counter"
756 " interrupt enable %d\n", smp_processor_id(), idx
);
760 if (idx
== ARMV7_CYCLE_COUNTER
)
761 val
= ARMV7_INTENC_C
;
763 val
= ARMV7_INTENC_P(idx
);
765 asm volatile("mcr p15, 0, %0, c9, c14, 2" : : "r" (val
));
770 static inline u32
armv7_pmnc_getreset_flags(void)
775 asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val
));
777 /* Write to clear flags */
778 val
&= ARMV7_FLAG_MASK
;
779 asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (val
));
785 static void armv7_pmnc_dump_regs(void)
790 printk(KERN_INFO
"PMNC registers dump:\n");
792 asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r" (val
));
793 printk(KERN_INFO
"PMNC =0x%08x\n", val
);
795 asm volatile("mrc p15, 0, %0, c9, c12, 1" : "=r" (val
));
796 printk(KERN_INFO
"CNTENS=0x%08x\n", val
);
798 asm volatile("mrc p15, 0, %0, c9, c14, 1" : "=r" (val
));
799 printk(KERN_INFO
"INTENS=0x%08x\n", val
);
801 asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val
));
802 printk(KERN_INFO
"FLAGS =0x%08x\n", val
);
804 asm volatile("mrc p15, 0, %0, c9, c12, 5" : "=r" (val
));
805 printk(KERN_INFO
"SELECT=0x%08x\n", val
);
807 asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (val
));
808 printk(KERN_INFO
"CCNT =0x%08x\n", val
);
810 for (cnt
= ARMV7_COUNTER0
; cnt
< ARMV7_COUNTER_LAST
; cnt
++) {
811 armv7_pmnc_select_counter(cnt
);
812 asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (val
));
813 printk(KERN_INFO
"CNT[%d] count =0x%08x\n",
814 cnt
-ARMV7_EVENT_CNT_TO_CNTx
, val
);
815 asm volatile("mrc p15, 0, %0, c9, c13, 1" : "=r" (val
));
816 printk(KERN_INFO
"CNT[%d] evtsel=0x%08x\n",
817 cnt
-ARMV7_EVENT_CNT_TO_CNTx
, val
);
822 static void armv7pmu_enable_event(struct hw_perf_event
*hwc
, int idx
)
827 * Enable counter and interrupt, and set the counter to count
828 * the event that we're interested in.
830 raw_spin_lock_irqsave(&pmu_lock
, flags
);
835 armv7_pmnc_disable_counter(idx
);
838 * Set event (if destined for PMNx counters)
839 * We don't need to set the event if it's a cycle count
841 if (idx
!= ARMV7_CYCLE_COUNTER
)
842 armv7_pmnc_write_evtsel(idx
, hwc
->config_base
);
845 * Enable interrupt for this counter
847 armv7_pmnc_enable_intens(idx
);
852 armv7_pmnc_enable_counter(idx
);
854 raw_spin_unlock_irqrestore(&pmu_lock
, flags
);
857 static void armv7pmu_disable_event(struct hw_perf_event
*hwc
, int idx
)
862 * Disable counter and interrupt
864 raw_spin_lock_irqsave(&pmu_lock
, flags
);
869 armv7_pmnc_disable_counter(idx
);
872 * Disable interrupt for this counter
874 armv7_pmnc_disable_intens(idx
);
876 raw_spin_unlock_irqrestore(&pmu_lock
, flags
);
879 static irqreturn_t
armv7pmu_handle_irq(int irq_num
, void *dev
)
882 struct perf_sample_data data
;
883 struct cpu_hw_events
*cpuc
;
884 struct pt_regs
*regs
;
888 * Get and reset the IRQ flags
890 pmnc
= armv7_pmnc_getreset_flags();
893 * Did an overflow occur?
895 if (!armv7_pmnc_has_overflowed(pmnc
))
899 * Handle the counter(s) overflow(s)
901 regs
= get_irq_regs();
903 perf_sample_data_init(&data
, 0);
905 cpuc
= &__get_cpu_var(cpu_hw_events
);
906 for (idx
= 0; idx
<= armpmu
->num_events
; ++idx
) {
907 struct perf_event
*event
= cpuc
->events
[idx
];
908 struct hw_perf_event
*hwc
;
910 if (!test_bit(idx
, cpuc
->active_mask
))
914 * We have a single interrupt for all counters. Check that
915 * each counter has overflowed before we process it.
917 if (!armv7_pmnc_counter_has_overflowed(pmnc
, idx
))
921 armpmu_event_update(event
, hwc
, idx
, 1);
922 data
.period
= event
->hw
.last_period
;
923 if (!armpmu_event_set_period(event
, hwc
, idx
))
926 if (perf_event_overflow(event
, 0, &data
, regs
))
927 armpmu
->disable(hwc
, idx
);
931 * Handle the pending perf events.
933 * Note: this call *must* be run with interrupts disabled. For
934 * platforms that can have the PMU interrupts raised as an NMI, this
942 static void armv7pmu_start(void)
946 raw_spin_lock_irqsave(&pmu_lock
, flags
);
947 /* Enable all counters */
948 armv7_pmnc_write(armv7_pmnc_read() | ARMV7_PMNC_E
);
949 raw_spin_unlock_irqrestore(&pmu_lock
, flags
);
952 static void armv7pmu_stop(void)
956 raw_spin_lock_irqsave(&pmu_lock
, flags
);
957 /* Disable all counters */
958 armv7_pmnc_write(armv7_pmnc_read() & ~ARMV7_PMNC_E
);
959 raw_spin_unlock_irqrestore(&pmu_lock
, flags
);
962 static int armv7pmu_get_event_idx(struct cpu_hw_events
*cpuc
,
963 struct hw_perf_event
*event
)
967 /* Always place a cycle counter into the cycle counter. */
968 if (event
->config_base
== ARMV7_PERFCTR_CPU_CYCLES
) {
969 if (test_and_set_bit(ARMV7_CYCLE_COUNTER
, cpuc
->used_mask
))
972 return ARMV7_CYCLE_COUNTER
;
975 * For anything other than a cycle counter, try and use
976 * the events counters
978 for (idx
= ARMV7_COUNTER0
; idx
<= armpmu
->num_events
; ++idx
) {
979 if (!test_and_set_bit(idx
, cpuc
->used_mask
))
983 /* The counters are all in use. */
988 static void armv7pmu_reset(void *info
)
990 u32 idx
, nb_cnt
= armpmu
->num_events
;
992 /* The counter and interrupt enable registers are unknown at reset. */
993 for (idx
= 1; idx
< nb_cnt
; ++idx
)
994 armv7pmu_disable_event(NULL
, idx
);
996 /* Initialize & Reset PMNC: C and P bits */
997 armv7_pmnc_write(ARMV7_PMNC_P
| ARMV7_PMNC_C
);
1000 static struct arm_pmu armv7pmu
= {
1001 .handle_irq
= armv7pmu_handle_irq
,
1002 .enable
= armv7pmu_enable_event
,
1003 .disable
= armv7pmu_disable_event
,
1004 .read_counter
= armv7pmu_read_counter
,
1005 .write_counter
= armv7pmu_write_counter
,
1006 .get_event_idx
= armv7pmu_get_event_idx
,
1007 .start
= armv7pmu_start
,
1008 .stop
= armv7pmu_stop
,
1009 .reset
= armv7pmu_reset
,
1010 .raw_event_mask
= 0xFF,
1011 .max_period
= (1LLU << 32) - 1,
1014 static u32 __init
armv7_read_num_pmnc_events(void)
1018 /* Read the nb of CNTx counters supported from PMNC */
1019 nb_cnt
= (armv7_pmnc_read() >> ARMV7_PMNC_N_SHIFT
) & ARMV7_PMNC_N_MASK
;
1021 /* Add the CPU cycles counter and return */
1025 static const struct arm_pmu
*__init
armv7_a8_pmu_init(void)
1027 armv7pmu
.id
= ARM_PERF_PMU_ID_CA8
;
1028 armv7pmu
.name
= "ARMv7 Cortex-A8";
1029 armv7pmu
.cache_map
= &armv7_a8_perf_cache_map
;
1030 armv7pmu
.event_map
= &armv7_a8_perf_map
;
1031 armv7pmu
.num_events
= armv7_read_num_pmnc_events();
1035 static const struct arm_pmu
*__init
armv7_a9_pmu_init(void)
1037 armv7pmu
.id
= ARM_PERF_PMU_ID_CA9
;
1038 armv7pmu
.name
= "ARMv7 Cortex-A9";
1039 armv7pmu
.cache_map
= &armv7_a9_perf_cache_map
;
1040 armv7pmu
.event_map
= &armv7_a9_perf_map
;
1041 armv7pmu
.num_events
= armv7_read_num_pmnc_events();
1045 static const struct arm_pmu
*__init
armv7_a5_pmu_init(void)
1047 armv7pmu
.id
= ARM_PERF_PMU_ID_CA5
;
1048 armv7pmu
.name
= "ARMv7 Cortex-A5";
1049 armv7pmu
.cache_map
= &armv7_a5_perf_cache_map
;
1050 armv7pmu
.event_map
= &armv7_a5_perf_map
;
1051 armv7pmu
.num_events
= armv7_read_num_pmnc_events();
1055 static const struct arm_pmu
*__init
armv7_a8_pmu_init(void)
1060 static const struct arm_pmu
*__init
armv7_a9_pmu_init(void)
1065 static const struct arm_pmu
*__init
armv7_a5_pmu_init(void)
1069 #endif /* CONFIG_CPU_V7 */